{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "-----------\n",
    "* 日期：2023-05-10 week12（周三）\n",
    "* 课程：Python\n",
    "* 记录人：Xiao lu\n",
    "\n",
    "-----------"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 数据准备-liepin-PM"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 请求页面准备\n",
    "> 1. 找到页面的数据API接口\n",
    "> 2. 提供正确的用户请求酬载（payload）\n",
    "> 3. 准备请求的headers，增加cookie信息（用户登录之后的cookie），保证数据的合理性\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:54:32.285829Z",
     "iopub.status.busy": "2023-06-14T09:54:32.285168Z",
     "iopub.status.idle": "2023-06-14T09:54:40.114303Z",
     "shell.execute_reply": "2023-06-14T09:54:40.112953Z",
     "shell.execute_reply.started": "2023-06-14T09:54:32.285795Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdin",
     "output_type": "stream",
     "text": [
      "请输入你要查询的职位： 产品经理\r\n"
     ]
    }
   ],
   "source": [
    "# Job keyword for the search; surrounding whitespace is trimmed so that\n",
    "# stray spaces from typing or pasting do not become part of the query.\n",
    "用户输入职位 = input(\"请输入你要查询的职位：\").strip()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:54:44.063647Z",
     "iopub.status.busy": "2023-06-14T09:54:44.062146Z",
     "iopub.status.idle": "2023-06-14T09:54:44.068648Z",
     "shell.execute_reply": "2023-06-14T09:54:44.067570Z",
     "shell.execute_reply.started": "2023-06-14T09:54:44.063594Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Lookup table: city name -> region code placed in the search payload's\n",
    "# `city` and `dq` fields.\n",
    "城市编码 = {\n",
    "    \"北京\": \"010\",\n",
    "    \"上海\": \"020\",\n",
    "    \"广州\": \"050020\",\n",
    "    \"深圳\": \"050090\",\n",
    "    \"香港\": \"320\",\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:54:49.409717Z",
     "iopub.status.busy": "2023-06-14T09:54:49.409167Z",
     "iopub.status.idle": "2023-06-14T09:54:57.874045Z",
     "shell.execute_reply": "2023-06-14T09:54:57.872944Z",
     "shell.execute_reply.started": "2023-06-14T09:54:49.409680Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdin",
     "output_type": "stream",
     "text": [
      "请输入你要查询的城市： 香港\r\n"
     ]
    }
   ],
   "source": [
    "用户输入城市 = input(\"请输入你要查询的城市：\").strip()\n",
    "# Keep asking until the city is a key of 城市编码: the request cell looks the\n",
    "# code up with 城市编码[用户输入城市], which would otherwise raise KeyError.\n",
    "while 用户输入城市 not in 城市编码:\n",
    "    用户输入城市 = input(f\"暂不支持“{用户输入城市}”，请从 {'/'.join(城市编码)} 中选择：\").strip()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:55:01.259381Z",
     "iopub.status.busy": "2023-06-14T09:55:01.258719Z",
     "iopub.status.idle": "2023-06-14T09:55:01.570940Z",
     "shell.execute_reply": "2023-06-14T09:55:01.569811Z",
     "shell.execute_reply.started": "2023-06-14T09:55:01.259345Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'flag': 1, 'data': {'data': {'jobCardList': [{'job': {'labels': ['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '产品优化', '产品设计', '用户研究', '交互设计', '团队管理'], 'jobKind': '2', 'dataPromId': 'd_sfrom=search_prime&d_ckId=null&d_curPage=0&d_pageSize=40&d_headId=null&d_posi=0&skId=h2c8pxojavrmo1w785z7ueih2ybfpux8&fkId=h2c8pxojavrmo1w785z7ueih2ybfpux8&ckId=h2c8pxojavrmo1w785z7ueih2ybfpux8&sfrom=search_job_pc&curPage=0&pageSize=40&index=0', 'jobId': '51880109', 'refreshTime': '20221118143443', 'advViewFlag': False, 'topJob': False, 'title': '产品经理 Product Manager', 'salary': '薪资面议', 'dq': '香港-观塘区', 'link': 'https://www.liepin.com/job/1951880109.shtml', 'pcOuterLink': '', 'h5OuterLink': '', 'requireWorkYears': '3-5年', 'requireEduLevel': '统招本科'}, 'recruiter': {'chatted': False, 'recruiterName': '邓女士', 'recruiterTitle': '人力资源经理/主管', 'recruiterId': '07bc072f44dc45b06882c0069b0a733a', 'imId': '9edddce19a93df8ae7b657921b02bb93', 'imUserType': '2', 'recruiterPhoto': '5f8f9866dfb13a7dee342f1808u.jpg'}, 'comp'\r\n"
     ]
    }
   ],
   "source": [
    "import getpass\n",
    "import json\n",
    "import os\n",
    "\n",
    "import requests\n",
    "\n",
    "# Job-search endpoint that the request below POSTs to.\n",
    "url = \"https://apic.liepin.com/api/com.liepin.searchfront4c.pc-search-job\"\n",
    "\n",
    "# Fail with a readable message instead of a bare KeyError when the city\n",
    "# entered by the user has no entry in the lookup table.\n",
    "if 用户输入城市 not in 城市编码:\n",
    "    raise ValueError(f\"不支持的城市：{用户输入城市!r}，可选城市：{'、'.join(城市编码)}\")\n",
    "city_code = 城市编码[用户输入城市]\n",
    "\n",
    "# Request body: the search form (city, keyword, paging) plus pass-through\n",
    "# tracking fields.\n",
    "payload = {\n",
    "    \"data\": {\n",
    "        \"mainSearchPcConditionForm\": {\n",
    "            \"city\": city_code,\n",
    "            \"dq\": city_code,\n",
    "            \"pubTime\": \"\",\n",
    "            \"currentPage\": 0,\n",
    "            \"pageSize\": 40,\n",
    "            \"key\": 用户输入职位,\n",
    "            \"suggestTag\": \"\",\n",
    "            \"workYearCode\": \"0\",\n",
    "            \"compId\": \"\",\n",
    "            \"compName\": \"\",\n",
    "            \"compTag\": \"\",\n",
    "            \"industry\": \"\",\n",
    "            \"salary\": \"\",\n",
    "            \"jobKind\": \"\",\n",
    "            \"compScale\": \"\",\n",
    "            \"compKind\": \"\",\n",
    "            \"compStage\": \"\",\n",
    "            \"eduLevel\": \"\"\n",
    "        },\n",
    "        \"passThroughForm\": {\n",
    "            \"scene\": \"input\",\n",
    "            \"skId\": \"\",\n",
    "            \"fkId\": \"\",\n",
    "            \"ckId\": \"h2c8pxojavrmo1w785z7ueih2ybfpux8\",\n",
    "            \"suggest\": None\n",
    "        }\n",
    "    }\n",
    "}\n",
    "\n",
    "# The login cookie is a credential, so it is read from the LIEPIN_COOKIE\n",
    "# environment variable (or prompted for without echo) rather than being\n",
    "# stored in the notebook.\n",
    "cookie = os.environ.get('LIEPIN_COOKIE') or getpass.getpass('请粘贴登录后的 liepin Cookie：')\n",
    "cookie = cookie.strip()\n",
    "# Reuse the cookie's XSRF-TOKEN value for the X-XSRF-TOKEN header.\n",
    "xsrf_token = next(\n",
    "    (part.strip().split('=', 1)[1]\n",
    "     for part in cookie.split(';')\n",
    "     if part.strip().startswith('XSRF-TOKEN=')),\n",
    "    '',\n",
    ")\n",
    "\n",
    "# set the headers\n",
    "# (no explicit Content-Length: requests computes it from the actual body,\n",
    "# whose size changes with the keyword and city)\n",
    "headers = {\n",
    "    'Accept': 'application/json, text/plain, */*',\n",
    "    'Accept-Encoding': 'gzip, deflate, br',\n",
    "    'Accept-Language': 'zh-CN,zh;q=0.9',\n",
    "    'Cache-Control': 'no-cache',\n",
    "    'Connection': 'keep-alive',\n",
    "    'Content-Type': 'application/json;charset=UTF-8;',\n",
    "    'Cookie': cookie,\n",
    "    'Host': 'apic.liepin.com',\n",
    "    'Origin': 'https://www.liepin.com',\n",
    "    'Pragma': 'no-cache',\n",
    "    'Referer': 'https://www.liepin.com/',\n",
    "    'sec-ch-ua': '\"Google Chrome\";v=\"111\", \"Not(A:Brand\";v=\"8\", \"Chromium\";v=\"111\"',\n",
    "    'sec-ch-ua-mobile': '?0',\n",
    "    'sec-ch-ua-platform': '\"Windows\"',\n",
    "    'Sec-Fetch-Dest': 'empty',\n",
    "    'Sec-Fetch-Mode': 'cors',\n",
    "    'Sec-Fetch-Site': 'same-site',\n",
    "    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/105.0.0.0 Safari/537.36',\n",
    "    'X-Client-Type': 'web',\n",
    "    'X-Fscp-Bi-Stat': '{\"location\": \"https://www.liepin.com/zhaopin/?inputFrom=www_index&workYearCode=0&key=%E4%BA%A7%E5%93%81%E7%BB%8F%E7%90%86&scene=input&ckId=htihov8m2frxgy6ywo2wsg2gncnydzlb&dq=\"}',\n",
    "    'X-Fscp-Fe-Version': '',\n",
    "    'X-Fscp-Std-Info': '{\"client_id\": \"40108\"}',\n",
    "    'X-Fscp-Trace-Id': 'efb01166-77db-44f8-8596-3aadd07423a6',\n",
    "    'X-Fscp-Version': '1.1',\n",
    "    'X-Requested-With': 'XMLHttpRequest',\n",
    "    'X-XSRF-TOKEN': xsrf_token\n",
    "}\n",
    "\n",
    "# send a POST request with headers; the timeout keeps a stalled connection\n",
    "# from hanging the kernel, and HTTP error statuses raise immediately\n",
    "r = requests.post(url, data=json.dumps(payload), headers=headers, timeout=10)\n",
    "r.raise_for_status()\n",
    "\n",
    "# extract the JSON data from the response\n",
    "response_data = r.json()\n",
    "\n",
    "# print only the pagination summary rather than the whole response, which\n",
    "# is very large and includes recruiters' names\n",
    "print((response_data.get('data') or {}).get('pagination'))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 翻页获取数据\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T08:58:29.321341Z",
     "iopub.status.busy": "2023-06-14T08:58:29.320501Z",
     "iopub.status.idle": "2023-06-14T08:58:30.223740Z",
     "shell.execute_reply": "2023-06-14T08:58:30.222293Z",
     "shell.execute_reply.started": "2023-06-14T08:58:29.321294Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'flag': 1, 'data': {'data': {'jobCardList': [{'job': {'labels': ['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '产品优化', '产品设计', '用户研究', '交互设计', '团队管理'], 'salary': '薪资面议', 'dq': '香港-观塘区', 'requireWorkYears': '3-5年', 'refreshTime': '20221118143443', 'jobId': '51880109', 'jobKind': '2', 'topJob': False, 'advViewFlag': False, 'title': '产品经理 Product Manager', 'link': 'https://www.liepin.com/job/1951880109.shtml', 'dataPromId': 'd_sfrom=search_prime&d_ckId=null&d_curPage=0&d_pageSize=40&d_headId=null&d_posi=0&skId=h2c8pxojavrmo1w785z7ueih2ybfpux8&fkId=h2c8pxojavrmo1w785z7ueih2ybfpux8&ckId=h2c8pxojavrmo1w785z7ueih2ybfpux8&sfrom=search_job_pc&curPage=0&pageSize=40&index=0', 'pcOuterLink': '', 'h5OuterLink': '', 'requireEduLevel': '统招本科'}, 'dataInfo': '%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2ybfpux8%22%2C%22scene%22%3A%22input%22%2C%22skId%22%3A%22h2c8pxojavrmo1w785z7ueih2ybfpux8%22%2C%22fkId%22%3A%22h2c8pxojavrmo1w785z7ueih2ybfpux8%22%2C%22jobId%22%3A%2251880109%22%2C%22pageSize%22%3A%2240%2\r\n",
      "{'flag': 1, 'data': {'data': {'jobCardList': [{'dataParams': '{\"jobId\":\"45171269\",\"recruiterName\":\"陈女士\",\"imId\":\"0340e4988b0b521224eff958a002fd93\",\"imUserType\":\"2\",\"userId\":\"4f3dc3179f60132febf15e5f94b9c8cd\",\"jobKind\":\"1\",\"recruiterPhoto\":\"6316e8a847115a35510f5f0405u.jpg\"}', 'job': {'labels': ['CRM软件', '需求确认', '营销项目', 'CRM系统'], 'jobId': '45171269', 'salary': '35-55k', 'dq': '香港', 'refreshTime': '20230411100837', 'title': '数字化产品经理', 'jobKind': '1', 'topJob': False, 'link': 'https://www.liepin.com/a/45171269.shtml', 'requireWorkYears': '5-10年', 'advViewFlag': False, 'dataPromId': 'd_sfrom=search_prime&d_ckId=null&d_curPage=1&d_pageSize=40&d_headId=null&d_posi=0&skId=h2c8pxojavrmo1w785z7ueih2ybfpux8&fkId=h2c8pxojavrmo1w785z7ueih2ybfpux8&ckId=h2c8pxojavrmo1w785z7ueih2ybfpux8&sfrom=search_job_pc&curPage=1&pageSize=40&index=0', 'requireEduLevel': '学历不限'}, 'recruiter': {'recruiterName': '陈女士', 'recruiterTitle': '猎头顾问', 'imId': '0340e4988b0b521224eff958a002fd93', 'imUserType': '2', 'chatted': F\r\n",
      "{'flag': 1, 'data': {'data': {'jobCardList': [{'dataParams': '{\"recruiterName\":\"谢女士\",\"imId\":\"e39bf1a7adbdc6879809d03804875792\",\"imUserType\":\"2\",\"jobKind\":\"1\",\"jobId\":\"45988881\",\"userId\":\"763ec2919c35c6a833d9d464c271fc44\",\"recruiterPhoto\":\"6136e2286922c96d6db166a303u.png\"}', 'job': {'labels': ['项目工程师', '香港工作', '土木工程', '结构工程'], 'jobKind': '1', 'title': '\\xa090M0116548项目工程师(base 香港）', 'salary': '20-30k', 'dq': '香港', 'refreshTime': '20230510114027', 'jobId': '45988881', 'dataPromId': 'd_sfrom=search_prime&d_ckId=null&d_curPage=2&d_pageSize=40&d_headId=null&d_posi=0&skId=h2c8pxojavrmo1w785z7ueih2ybfpux8&fkId=h2c8pxojavrmo1w785z7ueih2ybfpux8&ckId=h2c8pxojavrmo1w785z7ueih2ybfpux8&sfrom=search_job_pc&curPage=2&pageSize=40&index=0', 'topJob': False, 'link': 'https://www.liepin.com/a/45988881.shtml', 'advViewFlag': False, 'requireEduLevel': '本科及以上', 'requireWorkYears': '3-5年'}, 'recruiter': {'recruiterName': '谢女士', 'recruiterTitle': '猎头顾问', 'imId': 'e39bf1a7adbdc6879809d03804875792', 'imUserType\r\n",
      "{'flag': 1, 'data': {'data': {}, 'passThroughData': {'ckId': 'h2c8pxojavrmo1w785z7ueih2ybfpux8', 'scene': 'input', 'skId': 'h2c8pxojavrmo1w785z7ueih2ybfpux8', 'fkId': 'h2c8pxojavrmo1w785z7ueih2ybfpux8', 'sfrom': 'search_job_pc'}, 'pagination': {'currentPage': 3, 'totalCounts': 0, 'pageSize': 40, 'totalPage': 0, 'hasNext': False}}}\r\n"
     ]
    },
    {
     "ename": "KeyError",
     "evalue": "'jobCardList'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mKeyError\u001b[0m                                  Traceback (most recent call last)",
      "\u001b[0;32m/tmp/ipykernel_5040/1507514389.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m      9\u001b[0m     \u001b[0mresponse_data\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mr\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjson\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     10\u001b[0m     \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mresponse_data\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 11\u001b[0;31m     \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjson_normalize\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mresponse_data\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'data'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'data'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'jobCardList'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m     12\u001b[0m     \u001b[0mresponse_df\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
      "\u001b[0;31mKeyError\u001b[0m: 'jobCardList'"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "MAX_PAGES = 21  # upper bound on the number of result pages to request\n",
    "\n",
    "# One DataFrame per page that actually returned job cards.\n",
    "response_df = []\n",
    "for i in range(MAX_PAGES):\n",
    "    payload['data']['mainSearchPcConditionForm']['currentPage'] = i\n",
    "    # send a POST request with headers; fail fast on stalls and HTTP errors\n",
    "    r = requests.post(url, data=json.dumps(payload), headers=headers, timeout=10)\n",
    "    r.raise_for_status()\n",
    "\n",
    "    # extract the JSON data from the response\n",
    "    response_data = r.json()\n",
    "\n",
    "    # A page past the last result comes back with an empty inner `data`\n",
    "    # object (no 'jobCardList' key), so stop there instead of raising\n",
    "    # KeyError.\n",
    "    job_cards = ((response_data.get('data') or {}).get('data') or {}).get('jobCardList')\n",
    "    if not job_cards:\n",
    "        break\n",
    "\n",
    "    df = pd.json_normalize(job_cards)\n",
    "    response_df.append(df)\n",
    "    # short progress line instead of dumping the whole response\n",
    "    print(f'第 {i} 页：{len(job_cards)} 条职位')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T08:59:21.399746Z",
     "iopub.status.busy": "2023-06-14T08:59:21.399022Z",
     "iopub.status.idle": "2023-06-14T08:59:21.494552Z",
     "shell.execute_reply": "2023-06-14T08:59:21.493137Z",
     "shell.execute_reply.started": "2023-06-14T08:59:21.399706Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[                                             dataInfo  \\\n",
       " 0   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 1   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 2   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 3   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 4   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 5   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 6   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 7   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 8   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 9   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 10  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 11  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 12  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 13  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 14  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 15  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 16  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 17  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 18  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 19  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 20  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 21  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 22  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 23  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 24  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 25  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 26  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 27  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 28  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 29  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 30  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 31  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 32  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 33  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 34  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 35  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 36  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 37  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 38  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 39  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " \n",
       "                                            dataParams  \\\n",
       " 0   {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       " 1   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       " 2   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       " 3   {\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...   \n",
       " 4   {\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...   \n",
       " 5   {\"userId\":\"81fe889034bcaad777e6dcdcf1ccb74d\",\"...   \n",
       " 6   {\"userId\":\"60aa21ab3fe77c74f7964ecba50473f1\",\"...   \n",
       " 7   {\"userId\":\"435fd20952d5471977265bfed7712363\",\"...   \n",
       " 8   {\"userId\":\"320a86d5d4dcb150549c017a70b4d785\",\"...   \n",
       " 9   {\"userId\":\"c94d41b5875c19b514003927d0b811f0\",\"...   \n",
       " 10  {\"userId\":\"81fe889034bcaad777e6dcdcf1ccb74d\",\"...   \n",
       " 11  {\"userId\":\"7fd011c520a166d9a7e2465e724eded9\",\"...   \n",
       " 12  {\"userId\":\"665abaa54b64a2a10820b94a0ead5d88\",\"...   \n",
       " 13  {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       " 14  {\"userId\":\"7705f15f9d97b5179219e7c34b570890\",\"...   \n",
       " 15  {\"userId\":\"bf56f38818e707ef0c37f8e61680451b\",\"...   \n",
       " 16  {\"userId\":\"e706daa5965eddf392b75fe4e3afd042\",\"...   \n",
       " 17  {\"userId\":\"472cc3a9ee970e3ea7069dd1f9b4f0ec\",\"...   \n",
       " 18  {\"userId\":\"94fde39adebf90340caabbe82932c5d0\",\"...   \n",
       " 19  {\"userId\":\"eadecc94dbac89033e4a55fe73fc2fd7\",\"...   \n",
       " 20  {\"userId\":\"63e4eeb8e577e92f7c8c7ef7b6ae2c0e\",\"...   \n",
       " 21  {\"userId\":\"56362c7d170e1090f265d258de4e4be8\",\"...   \n",
       " 22  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 23  {\"userId\":\"54aebe2b86874dac40a35a6faa871265\",\"...   \n",
       " 24  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 25  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 26  {\"userId\":\"b01dfeb6aac4dfca7aaf2cf99ccd846c\",\"...   \n",
       " 27  {\"userId\":\"5540ec557f9c318ea4cd2d419081aa73\",\"...   \n",
       " 28  {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       " 29  {\"userId\":\"b0483e58237f0c40811c317f6ce9f5b5\",\"...   \n",
       " 30  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 31  {\"userId\":\"2bdfd525f33baeb4bbc0f46f65179d0d\",\"...   \n",
       " 32  {\"userId\":\"9821aff1bffb45839d4710e93bacf4e5\",\"...   \n",
       " 33  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 34  {\"userId\":\"881b2d6cf4d7bf527379bd0cc1beaffa\",\"...   \n",
       " 35  {\"userId\":\"d5edf200a68183f18dc7b1298e13a96e\",\"...   \n",
       " 36  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " 37  {\"userId\":\"6ac872ec192e19de9e494083d5c4c6b7\",\"...   \n",
       " 38  {\"userId\":\"f09669d38e90f5150e7cbcc316046c74\",\"...   \n",
       " 39  {\"userId\":\"571f4182d2e63db67aed0b08ee27d5f8\",\"...   \n",
       " \n",
       "                                            job.labels    job.salary  job.dq  \\\n",
       " 0   [金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...          薪资面议  香港-观塘区   \n",
       " 1                  [IT互联网, SaaS产品, to B, 产品设计, 移动端产品]        25-40k  香港-观塘区   \n",
       " 2                                                  []        40-60k  香港-观塘区   \n",
       " 3                                        [交易产品, 金融行业]          薪资面议  香港-中西区   \n",
       " 4                                                  []          薪资面议   香港-东区   \n",
       " 5                                                  []        40-70k  香港-中西区   \n",
       " 6                                                  []        30-60k      香港   \n",
       " 7                                                  []        30-55k      香港   \n",
       " 8                                                  []        50-55k      香港   \n",
       " 9                                            [金融产品经理]    14-40k·14薪  香港-观塘区   \n",
       " 10                                                 []    45-75k·15薪  香港-中西区   \n",
       " 11               [区块链, 产品规划, web3, 数据产品, to C, IT互联网]        25-30k  香港-葵青区   \n",
       " 12                                                 []        35-65k      香港   \n",
       " 13                                             [征信行业]        35-65k  香港-观塘区   \n",
       " 14  [金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...        15-25k      香港   \n",
       " 15                     [商业产品, 用户研究, 团队管理, 产品规划, 数据分析]        50-80k  香港-荃湾区   \n",
       " 16                                       [硬件产品, 游戏产品]        20-30k      香港   \n",
       " 17                                                 []  120-240k·30薪      香港   \n",
       " 18  [需求分析, IT互联网, 区块链, web端产品, 产品规划, 用户研究, 市场调研, 原...        30-50k      香港   \n",
       " 19  [CRM产品, 策略产品, 工具产品, 数据产品, to C, CRM系统, 广告营销, 用...        30-45k      香港   \n",
       " 20                                      [量化交易, CTA策略]          薪资面议  香港-湾仔区   \n",
       " 21                                                 []    20-40k·15薪  香港-湾仔区   \n",
       " 22      [投资产品, 工具产品, 电商产品, 通讯/网络设备, 广告营销, 电子商务, 产品优化]        22-30k  香港-葵青区   \n",
       " 23                                                 []          薪资面议  香港-中西区   \n",
       " 24                                                 []          薪资面议  香港-葵青区   \n",
       " 25                                                 []          薪资面议  香港-葵青区   \n",
       " 26                                                 []        30-60k      香港   \n",
       " 27                                                 []          薪资面议  香港-中西区   \n",
       " 28                                 [数据产品, 征信行业, 产品优化]        35-65k  香港-观塘区   \n",
       " 29                                                 []          薪资面议  香港-中西区   \n",
       " 30                                                 []        40-50k  香港-葵青区   \n",
       " 31                                                 []        20-30k      香港   \n",
       " 32                                       [产品设计, 产品规划]        30-50k      香港   \n",
       " 33                                                 []          薪资面议  香港-葵青区   \n",
       " 34                      [智能家居, 物联网, 智慧家居, 智能硬件, 照明产品]        25-45k      香港   \n",
       " 35  [金融产品, 产品经理, 投资管理, 资产管理, 财富管理, Product Manager...    30-40k·20薪      香港   \n",
       " 36               [商业产品, 云计算, 移动端产品, 用户研究, 竞品分析, 团队管理]        30-45k  香港-葵青区   \n",
       " 37                                                 []          薪资面议  香港-湾仔区   \n",
       " 38  [需求挖掘, 数据分析, 需求分析, 产品规划, 需求调研, 产品设计, 计算机软件, 通讯...    15-30k·14薪  香港-沙田区   \n",
       " 39                                                 []        35-40k  香港-西贡区   \n",
       " \n",
       "    job.requireWorkYears job.refreshTime job.jobId job.jobKind  job.topJob  \\\n",
       " 0                  3-5年  20221118143443  51880109           2       False   \n",
       " 1                 5-10年  20230602174402  58720383           2       False   \n",
       " 2                  3-5年  20230602174402  58720027           2       False   \n",
       " 3                 5-10年  20221230112638  55273999           2       False   \n",
       " 4                 10年以上  20220810153828  51789749           2       False   \n",
       " 5                 5-10年  20230206145433  55840243           2       False   \n",
       " 6                 5-10年  20230331182809  44927829           1       False   \n",
       " 7                 5-10年  20230413145802  45274199           1       False   \n",
       " 8                  经验不限  20230508100942  44905303           1       False   \n",
       " 9                  3-5年  20230321145120  46695121           2       False   \n",
       " 10                5-10年  20230201164843  55712575           2       False   \n",
       " 11                5-10年  20230602105010  56823423           2       False   \n",
       " 12                 经验不限  20230614104154  46851031           1       False   \n",
       " 13                 3-5年  20221118143443  52641025           2       False   \n",
       " 14                5-10年  20221019114143  52992431           2       False   \n",
       " 15                5-10年  20230329171035  57400757           2       False   \n",
       " 16                 3-5年  20220428111306  41773779           2       False   \n",
       " 17                 经验不限  20230614000003  46681881           1       False   \n",
       " 18                 3-5年  20230613150326  45094373           1       False   \n",
       " 19                5-10年  20230614091839  45018467           1       False   \n",
       " 20                 经验不限  20221101185646  53527459           2       False   \n",
       " 21                 3-5年  20230530115501  57608899           2       False   \n",
       " 22                 3-5年  20221222102158  51771479           2       False   \n",
       " 23                 3-5年  20230518161439  54905861           2       False   \n",
       " 24                5-10年  20220624132417  50645371           2       False   \n",
       " 25                5-10年  20220624131859  50645221           2       False   \n",
       " 26                 经验不限  20230614104836  46076085           1       False   \n",
       " 27                 3-5年  20230406092245  55536541           2       False   \n",
       " 28                 3-5年  20221118143443  52640883           2       False   \n",
       " 29                 3-5年  20230614092239  56548437           2       False   \n",
       " 30                5-10年  20230614113453  59320155           2       False   \n",
       " 31                 1-3年  20230612161623  58939839           2       False   \n",
       " 32                 3-5年  20230613094815  46713347           1       False   \n",
       " 33                5-10年  20230324124715  54889143           2       False   \n",
       " 34                5-10年  20230609103322  58990437           2       False   \n",
       " 35                 3-5年  20230407004339  45072621           1       False   \n",
       " 36                5-10年  20220706123449  50914221           2       False   \n",
       " 37                 1-3年  20230207102923  55866839           2       False   \n",
       " 38                5-10年  20220916172526  52515275           2       False   \n",
       " 39                5-10年  20230331094111  57444481           2       False   \n",
       " \n",
       "     ...  recruiter.recruiterName    recruiter.recruiterTitle  \\\n",
       " 0   ...                      邓女士                   人力资源经理/主管   \n",
       " 1   ...                      李先生  Talent Acquisition Manager   \n",
       " 2   ...                      李先生  Talent Acquisition Manager   \n",
       " 3   ...                      卞女士                               \n",
       " 4   ...                      张女士                     Sourcer   \n",
       " 5   ...                      赵女士                      高级招聘经理   \n",
       " 6   ...                      熊女士                        猎头顾问   \n",
       " 7   ...                      熊先生                        猎头顾问   \n",
       " 8   ...                      吴女士                        猎头顾问   \n",
       " 9   ...                      阎女士                               \n",
       " 10  ...                      赵女士                      高级招聘经理   \n",
       " 11  ...                      谭女士                      人力招聘經理   \n",
       " 12  ...                      张女士                        猎头顾问   \n",
       " 13  ...                      邓女士                   人力资源经理/主管   \n",
       " 14  ...                      金先生                        HRBP   \n",
       " 15  ...                      赵女士                        猎头顾问   \n",
       " 16  ...                      刘女士                        业务总监   \n",
       " 17  ...                      任先生                        猎头顾问   \n",
       " 18  ...                      时女士                        猎头顾问   \n",
       " 19  ...                      黄女士                        猎头顾问   \n",
       " 20  ...                      李女士                          hr   \n",
       " 21  ...                      孔先生                   高级招聘/HRBP   \n",
       " 22  ...                      李女士                               \n",
       " 23  ...                      吴先生                      人力资源经理   \n",
       " 24  ...                      李女士                               \n",
       " 25  ...                      李女士                               \n",
       " 26  ...                      武女士                        猎头顾问   \n",
       " 27  ...                      郭先生                   人力资源经理/主管   \n",
       " 28  ...                      邓女士                   人力资源经理/主管   \n",
       " 29  ...                      吴先生                          HR   \n",
       " 30  ...                      李女士                               \n",
       " 31  ...                      黄女士                               \n",
       " 32  ...                      邓女士                        猎头顾问   \n",
       " 33  ...                      李女士                               \n",
       " 34  ...                      师先生                          HR   \n",
       " 35  ...                      陈女士                        猎头顾问   \n",
       " 36  ...                      李女士                               \n",
       " 37  ...                      张女士                        人事专员   \n",
       " 38  ...                      王女士                      行政人事经理   \n",
       " 39  ...                      李女士                               \n",
       " \n",
       "            recruiter.recruiterPhoto comp.compId comp.compScale  \\\n",
       " 0   5f8f9866dfb13a7dee342f1808u.jpg   8226823.0     2000-5000人   \n",
       " 1   61e1521019ffac3de11dd5c403u.png  13057723.0         50-99人   \n",
       " 2   61e1521019ffac3de11dd5c403u.png  13057723.0         50-99人   \n",
       " 3   5f8f9865ea60860b75384fa508u.jpg   4580900.0    5000-10000人   \n",
       " 4   5f8f9865ea60860b75384fa508u.jpg   1069385.0       10000人以上   \n",
       " 5   5f8f9866dfb13a7dee342f1808u.jpg   8622479.0     2000-5000人   \n",
       " 6   5f8fa3bddfb13a7dee343d7608u.png         NaN                  \n",
       " 7   5f8fa395dfb13a7dee343d2d08u.png         NaN                  \n",
       " 8   62b916b1b8552550b5dc281003u.jpg         NaN     2000-5000人   \n",
       " 9   5f8f9866dfb13a7dee342f1808u.jpg   9496537.0     1000-2000人   \n",
       " 10  5f8f9866dfb13a7dee342f1808u.jpg   8622479.0     2000-5000人   \n",
       " 11  5f8f9863f6d1ab58476f246a08u.jpg  13211309.0     1000-2000人   \n",
       " 12  54d0c580712e894a54c826f801a.jpg         NaN       100-499人   \n",
       " 13  5f8f9866dfb13a7dee342f1808u.jpg   8226823.0     2000-5000人   \n",
       " 14  5f8f9868f6d1ab58476f24a008u.jpg   8226823.0     2000-5000人   \n",
       " 15  5f8f98648dbe6273dcf8515508u.jpg    152511.0    5000-10000人   \n",
       " 16  5f8f9866dfb13a7dee342f1808u.jpg  12869049.0          1-49人   \n",
       " 17  63f78597514e04107e3432ec04u.png         NaN          1-49人   \n",
       " 18  5f8fa3bc8dbe6273dcf85e5e08u.png         NaN          1-49人   \n",
       " 19  608221d43846135f5300978a01u.jpg         NaN       100-499人   \n",
       " 20  5f8f986779c7cc70efbf36c008u.jpg   8177652.0         50-99人   \n",
       " 21  5f8f986c79c7cc70efbf36c808u.jpg  12899647.0       100-499人   \n",
       " 22  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 23  5f8f98698dbe6273dcf8516008u.jpg   8016742.0       100-499人   \n",
       " 24  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 25  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 26  5865ecc27032174cf9f93a1305a.jpg         NaN       10000人以上   \n",
       " 27  5f8f986c79c7cc70efbf36c808u.jpg   8016742.0       100-499人   \n",
       " 28  5f8f9866dfb13a7dee342f1808u.jpg   8226823.0     2000-5000人   \n",
       " 29  5f8f986c79c7cc70efbf36c808u.jpg   9791085.0       100-499人   \n",
       " 30  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 31  611f258c87c6945ee74812d106u.png   9329938.0       500-999人   \n",
       " 32  60a216ca071fb476257905f605u.jpg         NaN                  \n",
       " 33  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 34  5f8f986aea60860b75384fab08u.jpg   7893220.0       10000人以上   \n",
       " 35  5d2e9ad6dde7f0565c17697c04u.jpg         NaN       500-999人   \n",
       " 36  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " 37  628c507d4bb5bd439707beb201u.png   6422719.0       10000人以上   \n",
       " 38  5f8f98648dbe6273dcf8515508u.jpg  13311913.0         50-99人   \n",
       " 39  5f8f9865ea60860b75384fa508u.jpg   8932876.0       500-999人   \n",
       " \n",
       "                     comp.compName comp.compStage  \\\n",
       " 0                           金融壹账通           美股上市   \n",
       " 1   KPay merchant service limited            NaN   \n",
       " 2   KPay merchant service limited            NaN   \n",
       " 3                    中国国际金融股份有限公司         沪深A股上市   \n",
       " 4                            伊顿中国            NaN   \n",
       " 5                多点生活(中国)网络科技有限公司             C轮   \n",
       " 6                     某国内基金证券上市公司            已上市   \n",
       " 7                 某国内基金/证券/期货上市公司            已上市   \n",
       " 8                   某基金/证券/期货上市公司            已上市   \n",
       " 9                    创兴银行有限公司深圳分行            NaN   \n",
       " 10               多点生活(中国)网络科技有限公司             C轮   \n",
       " 11                     中国移动香港有限公司            NaN   \n",
       " 12                   在港中资银行背景金融机构          融资未公开   \n",
       " 13                          金融壹账通           美股上市   \n",
       " 14                          金融壹账通           美股上市   \n",
       " 15                           中企动力             其他   \n",
       " 16              Tactility limited            天使轮   \n",
       " 17                          某知名公司          融资未公开   \n",
       " 18                       某深圳互联网公司            NaN   \n",
       " 19                         某餐饮业公司          融资未公开   \n",
       " 20                   上海千象资产管理有限公司            NaN   \n",
       " 21                  北京必来屋网络科技有限公司            NaN   \n",
       " 22                     中国移动国际有限公司            NaN   \n",
       " 23                       集友银行福州分行            NaN   \n",
       " 24                     中国移动国际有限公司            NaN   \n",
       " 25                     中国移动国际有限公司            NaN   \n",
       " 26                        某基金证券公司          融资未公开   \n",
       " 27                       集友银行福州分行            NaN   \n",
       " 28                          金融壹账通           美股上市   \n",
       " 29                       集友银行深圳分行            NaN   \n",
       " 30                     中国移动国际有限公司            NaN   \n",
       " 31                 上海陆浦投资管理集团有限公司            NaN   \n",
       " 32                      某深圳外包服务公司            NaN   \n",
       " 33                     中国移动国际有限公司            NaN   \n",
       " 34                             浪潮            NaN   \n",
       " 35                某北京大型基金/证券/期货公司          融资未公开   \n",
       " 36                     中国移动国际有限公司            NaN   \n",
       " 37                          新华三集团            NaN   \n",
       " 38                     耀通科技投资有限公司            NaN   \n",
       " 39                     中国移动国际有限公司            NaN   \n",
       " \n",
       "                       comp.compLogo                                 comp.link  \\\n",
       " 0   5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       " 1   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       " 2   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       " 3   5bcd8a2f8e50a3257f7102c304a.jpg   https://www.liepin.com/company/4580900/   \n",
       " 4   5bfe9df574719d2aa34b7b2203a.png   https://www.liepin.com/company/1069385/   \n",
       " 5   5f39f2a1f6d1ab5847351ad307u.png   https://www.liepin.com/company/8622479/   \n",
       " 6   60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 7   60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 8   60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 9   5d1ae5e33fa7ce27b2a86b5906u.png   https://www.liepin.com/company/9496537/   \n",
       " 10  5f39f2a1f6d1ab5847351ad307u.png   https://www.liepin.com/company/8622479/   \n",
       " 11  62fca94128e72769b4c1d61e06u.png  https://www.liepin.com/company/13211309/   \n",
       " 12  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 13  5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       " 14  5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       " 15  59a7805a7032c9d2a21459c506a.jpg    https://www.liepin.com/company/152511/   \n",
       " 16  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/12869049/   \n",
       " 17  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 18  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 19  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 20  59786e9b70327b30a4e6cdd404a.jpg   https://www.liepin.com/company/8177652/   \n",
       " 21  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/12899647/   \n",
       " 22  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 23  64006e52b65d3e269b47968c08u.png   https://www.liepin.com/company/8016742/   \n",
       " 24  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 25  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 26  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 27  64006e52b65d3e269b47968c08u.png   https://www.liepin.com/company/8016742/   \n",
       " 28  5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       " 29  6038940e60e5677feb2a609f01u.png   https://www.liepin.com/company/9791085/   \n",
       " 30  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 31  6340eddf5fd2f55ef5a124be02u.png   https://www.liepin.com/company/9329938/   \n",
       " 32  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 33  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 34  5bfe9ebf74719d2aa34ba2af03a.png   https://www.liepin.com/company/7893220/   \n",
       " 35  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       " 36  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " 37  5bfea09e74719d2aa34bffc203a.png   https://www.liepin.com/company/6422719/   \n",
       " 38  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13311913/   \n",
       " 39  5bfea51674719d2aa34cd90503a.png   https://www.liepin.com/company/8932876/   \n",
       " \n",
       "    comp.compIndustry  \n",
       " 0               科技金融  \n",
       " 1               科技金融  \n",
       " 2               科技金融  \n",
       " 3           基金/证券/期货  \n",
       " 4              机械/设备  \n",
       " 5               电子商务  \n",
       " 6           基金/证券/期货  \n",
       " 7           基金/证券/期货  \n",
       " 8           基金/证券/期货  \n",
       " 9                 银行  \n",
       " 10              电子商务  \n",
       " 11          运营商/增值服务  \n",
       " 12          基金/证券/投资  \n",
       " 13              科技金融  \n",
       " 14              科技金融  \n",
       " 15              电子商务  \n",
       " 16              智能硬件  \n",
       " 17          基金/证券/期货  \n",
       " 18               互联网  \n",
       " 19               餐饮业  \n",
       " 20          基金/证券/期货  \n",
       " 21               互联网  \n",
       " 22              通信设备  \n",
       " 23                银行  \n",
       " 24              通信设备  \n",
       " 25              通信设备  \n",
       " 26          基金/证券/期货  \n",
       " 27                银行  \n",
       " 28              科技金融  \n",
       " 29                银行  \n",
       " 30              通信设备  \n",
       " 31          基金/证券/期货  \n",
       " 32           其他商务服务业  \n",
       " 33              通信设备  \n",
       " 34              IT服务  \n",
       " 35          基金/证券/期货  \n",
       " 36              通信设备  \n",
       " 37             计算机硬件  \n",
       " 38             计算机软件  \n",
       " 39              通信设备  \n",
       " \n",
       " [40 rows x 31 columns],\n",
       "                                            dataParams  \\\n",
       " 0   {\"jobId\":\"45171269\",\"recruiterName\":\"陈女士\",\"imI...   \n",
       " 1   {\"jobId\":\"55794821\",\"recruiterName\":\"寇先生\",\"imI...   \n",
       " 2   {\"jobId\":\"36919653\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " 3   {\"jobId\":\"36919449\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " 4   {\"jobId\":\"36919333\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " 5   {\"jobId\":\"36919541\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " 6   {\"jobId\":\"51789197\",\"recruiterName\":\"孙女士\",\"imI...   \n",
       " 7   {\"jobId\":\"46724441\",\"recruiterName\":\"陈女士\",\"imI...   \n",
       " 8   {\"jobId\":\"42358105\",\"recruiterName\":\"许先生\",\"imI...   \n",
       " 9   {\"jobId\":\"55540819\",\"recruiterName\":\"李先生\",\"imI...   \n",
       " 10  {\"jobId\":\"59168935\",\"recruiterName\":\"还先生\",\"imI...   \n",
       " 11  {\"jobId\":\"46477001\",\"recruiterName\":\"陈先生\",\"imI...   \n",
       " 12  {\"jobId\":\"45686459\",\"recruiterName\":\"黄先生\",\"imI...   \n",
       " 13  {\"jobId\":\"45674989\",\"recruiterName\":\"王女士\",\"imI...   \n",
       " 14  {\"jobId\":\"46006849\",\"recruiterName\":\"孙女士\",\"imI...   \n",
       " 15  {\"jobId\":\"45140215\",\"recruiterName\":\"陈女士\",\"imI...   \n",
       " 16  {\"jobId\":\"52324313\",\"recruiterName\":\"兰女士\",\"imI...   \n",
       " 17  {\"jobId\":\"52992597\",\"recruiterName\":\"金先生\",\"imI...   \n",
       " 18  {\"jobId\":\"45171567\",\"recruiterName\":\"陈女士\",\"imI...   \n",
       " 19  {\"jobId\":\"52325011\",\"recruiterName\":\"兰女士\",\"imI...   \n",
       " 20  {\"jobId\":\"58009627\",\"recruiterName\":\"张女士\",\"imI...   \n",
       " 21  {\"jobId\":\"46763687\",\"recruiterName\":\"牛先生\",\"imI...   \n",
       " 22  {\"jobId\":\"43394077\",\"recruiterName\":\"孙先生\",\"imI...   \n",
       " 23  {\"jobId\":\"46683553\",\"recruiterName\":\"张先生\",\"imI...   \n",
       " 24  {\"jobId\":\"55518261\",\"recruiterName\":\"尹女士\",\"imI...   \n",
       " 25  {\"jobId\":\"58223879\",\"recruiterName\":\"王女士\",\"imI...   \n",
       " 26  {\"jobId\":\"59131945\",\"recruiterName\":\"王女士\",\"imI...   \n",
       " 27  {\"jobId\":\"44761453\",\"recruiterName\":\"王女士\",\"imI...   \n",
       " 28  {\"jobId\":\"46850201\",\"recruiterName\":\"张女士\",\"imI...   \n",
       " 29  {\"jobId\":\"44762479\",\"recruiterName\":\"袁女士\",\"imI...   \n",
       " 30  {\"jobId\":\"57824497\",\"recruiterName\":\"陈女士\",\"imI...   \n",
       " 31  {\"jobId\":\"45790357\",\"recruiterName\":\"卢女士\",\"imI...   \n",
       " 32  {\"jobId\":\"58735393\",\"recruiterName\":\"刘女士\",\"imI...   \n",
       " 33  {\"jobId\":\"57348119\",\"recruiterName\":\"谢女士\",\"imI...   \n",
       " 34  {\"jobId\":\"58635435\",\"recruiterName\":\"张女士\",\"imI...   \n",
       " 35  {\"jobId\":\"48316303\",\"recruiterName\":\"陆女士\",\"imI...   \n",
       " 36  {\"jobId\":\"52237167\",\"recruiterName\":\"梁女士\",\"imI...   \n",
       " 37  {\"jobId\":\"53469539\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " 38  {\"jobId\":\"46182495\",\"recruiterName\":\"贺女士\",\"imI...   \n",
       " 39  {\"jobId\":\"57161555\",\"recruiterName\":\"李女士\",\"imI...   \n",
       " \n",
       "                                              dataInfo  \\\n",
       " 0   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 1   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 2   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 3   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 4   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 5   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 6   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 7   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 8   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 9   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 10  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 11  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 12  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 13  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 14  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 15  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 16  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 17  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 18  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 19  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 20  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 21  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 22  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 23  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 24  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 25  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 26  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 27  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 28  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 29  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 30  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 31  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 32  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 33  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 34  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 35  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 36  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 37  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 38  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " 39  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       " \n",
       "                                            job.labels job.jobId   job.salary  \\\n",
       " 0                          [CRM软件, 需求确认, 营销项目, CRM系统]  45171269       35-55k   \n",
       " 1                                         [客户管理, RFP]  55794821       20-45k   \n",
       " 2                                                  []  36919653         薪资面议   \n",
       " 3                                              [技术支持]  36919449         薪资面议   \n",
       " 4                                              [通信领域]  36919333         薪资面议   \n",
       " 5                                              [saas]  36919541         薪资面议   \n",
       " 6                                      [ActionScript]  51789197         薪资面议   \n",
       " 7                                             [新产品导入]  46724441   25-30k·13薪   \n",
       " 8   [EHS, PPE, 安全生产, 职业卫生, 工业卫生, HSE, ESH, Process...  42358105       15-30k   \n",
       " 9                                  [HCM, 售前, 本地化, 海外]  55540819   20-35k·15薪   \n",
       " 10                                                 []  59168935         薪资面议   \n",
       " 11                                                 []  46477001         1-2k   \n",
       " 12     [基金产品总监, 基金筛选, FOF基金, 对冲基金, 结构化产品, 基金尽调, 海外基金]  45686459  70-100k·16薪   \n",
       " 13                                                 []  45674989   60-90k·16薪   \n",
       " 14                                                 []  46006849  70-100k·22薪   \n",
       " 15  [市场营销, 竞品分析, 社交媒体, 社交媒介, 营销活动, 广告/传媒/文化, IT/互联...  45140215       30-50k   \n",
       " 16                            [施工现场管理, 建筑施工, PROJECT]  52324313       15-25k   \n",
       " 17                                                 []  52992597       15-25k   \n",
       " 18  [营销策划, 品牌策划, 自媒体策划, 社交媒体, 社交媒介, 营销活动, 广告/传媒/文化...  45171567       35-55k   \n",
       " 19                               [施工现场管理, 安防工程, 建筑施工]  52325011       15-16k   \n",
       " 20                                     [ActionScript]  58009627   15-30k·13薪   \n",
       " 21                                                 []  46763687       50-80k   \n",
       " 22  [美元VC, 清华姚班, 清华智班, 清华量信班, 机器人, 人工智能研究院, AI, Op...  43394077   60-90k·15薪   \n",
       " 23                                                 []  46683553  85-100k·24薪   \n",
       " 24                                                 []  55518261       15-30k   \n",
       " 25                                             [用户运营]  58223879   25-40k·15薪   \n",
       " 26        [包装设计, UG, SolidWorks, 结构设计, 3D设计, keyshot]  59131945       40-50k   \n",
       " 27                                                 []  44761453      70-100k   \n",
       " 28                     [数据产品, 工具产品, 平台产品, 数据分析, 团队管理]  46850201       30-60k   \n",
       " 29              [平台产品, 增长产品, IT互联网, 产品设计, 用户研究, 团队管理]  44762479  70-100k·16薪   \n",
       " 30                                                 []  57824497       18-25k   \n",
       " 31                                    [对冲基金, 医疗行业分析师]  45790357   30-60k·24薪   \n",
       " 32                                       [用户运营, 产品运营]  58735393       40-60k   \n",
       " 33                                                 []  57348119   30-40k·16薪   \n",
       " 34                                                 []  58635435       40-70k   \n",
       " 35                                                 []  48316303         薪资面议   \n",
       " 36            [质量管理, 风控项目, .NET, ASP.NET, ClickHouse]  52237167       25-30k   \n",
       " 37                                             [量化私募]  53469539         薪资面议   \n",
       " 38                                             [门店销售]  46182495       15-30k   \n",
       " 39  [大数据, 流程管理, 交付管理, 流程优化, 化工行业, IT/互联网/软件, PMP, ...  57161555       30-35k   \n",
       " \n",
       "      job.dq job.refreshTime  \\\n",
       " 0        香港  20230411100837   \n",
       " 1    香港-沙田区  20230323163619   \n",
       " 2    香港-葵青区  20220307152316   \n",
       " 3    香港-葵青区  20220307152316   \n",
       " 4    香港-葵青区  20220307152316   \n",
       " 5    香港-葵青区  20220307152316   \n",
       " 6     香港-东区  20220810152931   \n",
       " 7        香港  20230605200800   \n",
       " 8        香港  20230531095338   \n",
       " 9    香港-湾仔区  20230120141442   \n",
       " 10       香港  20230607205632   \n",
       " 11       香港  20230605154311   \n",
       " 12       香港  20230427110506   \n",
       " 13       香港  20230426182455   \n",
       " 14       香港  20230606195711   \n",
       " 15       香港  20230614105125   \n",
       " 16   香港-葵青区  20230505151345   \n",
       " 17       香港  20230113165725   \n",
       " 18       香港  20230411101144   \n",
       " 19   香港-葵青区  20230505151345   \n",
       " 20  香港-油尖旺区  20230421135307   \n",
       " 21       香港  20230606184047   \n",
       " 22       香港  20230414221246   \n",
       " 23       香港  20230605090108   \n",
       " 24   香港-湾仔区  20230528225940   \n",
       " 25   香港-湾仔区  20230601180213   \n",
       " 26   香港-中西区  20230606180330   \n",
       " 27       香港  20230613183631   \n",
       " 28       香港  20230614104154   \n",
       " 29       香港  20230531175836   \n",
       " 30   香港-葵青区  20230414165123   \n",
       " 31       香港  20230504173835   \n",
       " 32   香港-湾仔区  20230522152426   \n",
       " 33   香港-湾仔区  20230515112932   \n",
       " 34    香港-东区  20230607112011   \n",
       " 35   香港-中西区  20230421094849   \n",
       " 36   香港-葵青区  20230307110522   \n",
       " 37   香港-湾仔区  20221031094347   \n",
       " 38       香港  20230603003258   \n",
       " 39   香港-西贡区  20230331093653   \n",
       " \n",
       "                                             job.title job.jobKind  job.topJob  \\\n",
       " 0                                             数字化产品经理           1       False   \n",
       " 1                                              售前产品经理           2       False   \n",
       " 2                 Business Management Product Manager           2       False   \n",
       " 3               IoT solution & Device Product Manager           2       False   \n",
       " 4                           5G Device Product Manager           2       False   \n",
       " 5                                SaaS Product Manager           2       False   \n",
       " 6            Product Marketing Manager_Timing Devices           2       False   \n",
       " 7                                             新产品发展经理           1       False   \n",
       " 8                EHS技术产品研发经理 EHS Solutions RD Manager           2       False   \n",
       " 9                                  HCM产品行销经理\\售前顾问（香港）           2       False   \n",
       " 10                                         海外对冲基金产品专家           2       False   \n",
       " 11                                         海外对冲基金产品专家           1       False   \n",
       " 12                                         海外对冲基金产品总监           1       False   \n",
       " 13                                        基金产品总监(FOF)           1       False   \n",
       " 14                                             财富产品专家           1       False   \n",
       " 15                          Digital Marketing Manager           1       False   \n",
       " 16                 Project Design Engineer at HK Site           2       False   \n",
       " 17                               38518H-【CRA】数据资产管理经理           2       False   \n",
       " 18                                             数字营销经理           1       False   \n",
       " 19                        Project Engineer at HK Site           2       False   \n",
       " 20                                       HelpDesk技术支持           2       False   \n",
       " 21                                           对冲基金产品专家           1       False   \n",
       " 22                                           香港高级投资经理           1       False   \n",
       " 23                                               投资经理           1       False   \n",
       " 24                                      业务流程岗(J11204)           2       False   \n",
       " 25                                    境外-创新增长运营-香港、北京           2       False   \n",
       " 26                                            产品设计工程师           2       False   \n",
       " 27  Quantitative Portfolio Manager 量化投资基金经理 - SG/C...           1       False   \n",
       " 28                                              数字化转型           1       False   \n",
       " 29                                   平台产品leader（p7/8）           1       False   \n",
       " 30  Project Engineer - Project Management and Serv...           2       False   \n",
       " 31                                 Healthcare Analyst           1       False   \n",
       " 32                                          境外-创新增长运营           2       False   \n",
       " 33                                            结构化产品专家           2       False   \n",
       " 34                                    Account Manager           2       False   \n",
       " 35                              南方基金香港子公司(南方东英) 债券交易员           2       False   \n",
       " 36                                    石油化工项目工程师（派驻香港）           2       False   \n",
       " 37                Sales and Marketing Director(Q8560)           2       False   \n",
       " 38                                               销售代表           1       False   \n",
       " 39                                    数据中心运营流程管理高级工程师           2       False   \n",
       " \n",
       "     ...          recruiter.recruiterPhoto     comp.compName  \\\n",
       " 0   ...   6316e8a847115a35510f5f0405u.jpg      某广州其他商务服务业公司   \n",
       " 1   ...   54d1e768712eb4f6b84c2d1301a.jpg    京信通信技术(广州)有限公司   \n",
       " 2   ...   5f8f9865ea60860b75384fa508u.jpg        中国移动国际有限公司   \n",
       " 3   ...   5f8f9865ea60860b75384fa508u.jpg        中国移动国际有限公司   \n",
       " 4   ...   5f8f9865ea60860b75384fa508u.jpg        中国移动国际有限公司   \n",
       " 5   ...   5f8f9865ea60860b75384fa508u.jpg        中国移动国际有限公司   \n",
       " 6   ...   60e698774a74410e54a95f6e07u.png              伊顿中国   \n",
       " 7   ...   5e1ac27d29d83a67543f2f4704u.jpg     某大型食品/饮料/酒水公司   \n",
       " 8   ...   5f8f986bdfb13a7dee342f2108u.jpg           EHSCity   \n",
       " 9   ...   6397293d5944bd7af2e009f803u.png      用友网络科技股份有限公司   \n",
       " 10  ...   5f8f986aea60860b75384fab08u.jpg      上海歌斐资产管理有限公司   \n",
       " 11  ...   5d00bb549fae687d438bbf1008u.jpg       某基金/证券/期货公司   \n",
       " 12  ...   62fd9adc2e03d62b1aac193e06u.jpg             某知名公司   \n",
       " 13  ...   5f5a2b44f6d1ab5847518fe905u.png             某知名公司   \n",
       " 14  ...   63664321cc551b286e3be87304u.png         某国资控股上市集团   \n",
       " 15  ...   5e58665829d83a6754562c9704u.jpg             某知名公司   \n",
       " 16  ...   5f8f9866dfb13a7dee342f1808u.jpg      上海协同工程咨询有限公司   \n",
       " 17  ...   5f8f9868f6d1ab58476f24a008u.jpg             金融壹账通   \n",
       " 18  ...   6316e8a847115a35510f5f0405u.jpg      某广州其他商务服务业公司   \n",
       " 19  ...   5f8f9866dfb13a7dee342f1808u.jpg      上海协同工程咨询有限公司   \n",
       " 20  ...   61e7a73229da04039cf1a16503u.png         H&M Group   \n",
       " 21  ...   5e55dbc16324626e17a753d506u.jpg        某纽交所上市金融集团   \n",
       " 22  ...   616e2fad5b0bd51fb2d357e705u.png        早期投资双币科技基金   \n",
       " 23  ...   632538562ec8597bfa3fa54f06u.png             某知名公司   \n",
       " 24  ...   5f8f98648dbe6273dcf8515508u.jpg              光大证券   \n",
       " 25  ...   5f8f98648dbe6273dcf8515508u.jpg                美团   \n",
       " 26  ...   637b1d8574c3560fc436894d02u.png    艾迪孚贝(无锡)科技有限公司   \n",
       " 27  ...   62669814a8423a1f26d50ff803u.png         某大型基金证券公司   \n",
       " 28  ...   54d0c580712e894a54c826f801a.jpg      在港中资银行背景金融机构   \n",
       " 29  ...   622899b3129d985edb29e1ab05u.jpg             某知名公司   \n",
       " 30  ...   5f8f986779c7cc70efbf36c008u.jpg        中国移动香港有限公司   \n",
       " 31  ...   6462fb556beb43237502d75e01u.png             某知名公司   \n",
       " 32  ...   5f8f9866dfb13a7dee342f1808u.jpg                美团   \n",
       " 33  ...   5f8f986779c7cc70efbf36c008u.jpg      上海歌斐资产管理有限公司   \n",
       " 34  ...   5f8f9863f6d1ab58476f246a08u.jpg  深圳前海捷创未来技术服务有限公司   \n",
       " 35  ...   5f8f9866dfb13a7dee342f1808u.jpg      南方基金管理股份有限公司   \n",
       " 36  ...   5f8f986779c7cc70efbf36c008u.jpg              必维集团   \n",
       " 37  ...   5f8f986779c7cc70efbf36c008u.jpg      上海千象资产管理有限公司   \n",
       " 38  ...  5f83e6498dbe6273dcf22bb607u.jpeg      某上海大型珠宝/首饰公司   \n",
       " 39  ...   5f8f9865ea60860b75384fa508u.jpg        中国移动国际有限公司   \n",
       " \n",
       "                       comp.compLogo comp.compScale  \\\n",
       " 0   60e2fe0bf3df194a3c48adb502u.png                  \n",
       " 1   5bfe991b74719df0ac9991cd03a.png    5000-10000人   \n",
       " 2   5bfea51674719d2aa34cd90503a.png       500-999人   \n",
       " 3   5bfea51674719d2aa34cd90503a.png       500-999人   \n",
       " 4   5bfea51674719d2aa34cd90503a.png       500-999人   \n",
       " 5   5bfea51674719d2aa34cd90503a.png       500-999人   \n",
       " 6   5bfe9df574719d2aa34b7b2203a.png       10000人以上   \n",
       " 7   60e2fe0bf3df194a3c48adb502u.png    5000-10000人   \n",
       " 8   5fedac06bebf7311a41cc9b307u.png         50-99人   \n",
       " 9   5bfe978974719df0ac993f9803a.png       10000人以上   \n",
       " 10  5bfe8fd474719d35745a83f203a.png       100-499人   \n",
       " 11  60e2fe0bf3df194a3c48adb502u.png          1-49人   \n",
       " 12  60e2fe0bf3df194a3c48adb502u.png       100-499人   \n",
       " 13  60e2fe0bf3df194a3c48adb502u.png          1-49人   \n",
       " 14  60e2fe0bf3df194a3c48adb502u.png       10000人以上   \n",
       " 15  60e2fe0bf3df194a3c48adb502u.png         50-99人   \n",
       " 16  5f07d063543a971969eb6ddc04u.jpg       10000人以上   \n",
       " 17  5f3ca396ea60860b75020faa02u.jpg     2000-5000人   \n",
       " 18  60e2fe0bf3df194a3c48adb502u.png                  \n",
       " 19  5f07d063543a971969eb6ddc04u.jpg       10000人以上   \n",
       " 20  61c533f6ff410524b7f4696c04u.png     1000-2000人   \n",
       " 21  60e2fe0bf3df194a3c48adb502u.png       10000人以上   \n",
       " 22  60e2fe0bf3df194a3c48adb502u.png         50-99人   \n",
       " 23  60e2fe0bf3df194a3c48adb502u.png          1-49人   \n",
       " 24  6401a2dfeab4507021d30bd003u.png    5000-10000人   \n",
       " 25  5fe1a95455550936bbd28ea506u.png       10000人以上   \n",
       " 26  61b07937d0458d53c627567e02u.jpg       100-499人   \n",
       " 27  60e2fe0bf3df194a3c48adb502u.png       500-999人   \n",
       " 28  60e2fe0bf3df194a3c48adb502u.png       100-499人   \n",
       " 29  60e2fe0bf3df194a3c48adb502u.png         50-99人   \n",
       " 30  62fca94128e72769b4c1d61e06u.png     1000-2000人   \n",
       " 31  60e2fe0bf3df194a3c48adb502u.png       500-999人   \n",
       " 32  5fe1a95455550936bbd28ea506u.png       10000人以上   \n",
       " 33  5bfe8fd474719d35745a83f203a.png       100-499人   \n",
       " 34  63d4d7f3334c74039df34ccc07u.png                  \n",
       " 35  60e54741e2df5862a08674ba03u.png       500-999人   \n",
       " 36  59a3d5bf70325ec22ee5823006a.jpg    5000-10000人   \n",
       " 37  59786e9b70327b30a4e6cdd404a.jpg         50-99人   \n",
       " 38  60e2fe0bf3df194a3c48adb502u.png       500-999人   \n",
       " 39  5bfea51674719d2aa34cd90503a.png       500-999人   \n",
       " \n",
       "                                    comp.link comp.compIndustry  \\\n",
       " 0                                                      其他商务服务业   \n",
       " 1     https://www.liepin.com/company/941676/              通信设备   \n",
       " 2    https://www.liepin.com/company/8932876/              通信设备   \n",
       " 3    https://www.liepin.com/company/8932876/              通信设备   \n",
       " 4    https://www.liepin.com/company/8932876/              通信设备   \n",
       " 5    https://www.liepin.com/company/8932876/              通信设备   \n",
       " 6    https://www.liepin.com/company/1069385/             机械/设备   \n",
       " 7                                                     食品/饮料/酒水   \n",
       " 8   https://www.liepin.com/company/12518769/              咨询服务   \n",
       " 9    https://www.liepin.com/company/5634845/             计算机软件   \n",
       " 10   https://www.liepin.com/company/9194127/          基金/证券/期货   \n",
       " 11                                                    基金/证券/期货   \n",
       " 12                                                      专业技术服务   \n",
       " 13                                                      专业技术服务   \n",
       " 14                                                        融资租赁   \n",
       " 15                                                    食品/饮料/酒水   \n",
       " 16  https://www.liepin.com/company/12281677/        工程管理/勘察/监理   \n",
       " 17   https://www.liepin.com/company/8226823/              科技金融   \n",
       " 18                                                     其他商务服务业   \n",
       " 19  https://www.liepin.com/company/12281677/        工程管理/勘察/监理   \n",
       " 20   https://www.liepin.com/company/8373588/          服装/纺织/皮革   \n",
       " 21                                                    基金/证券/投资   \n",
       " 22                                                    基金/证券/投资   \n",
       " 23                                                        咨询服务   \n",
       " 24   https://www.liepin.com/company/8441886/          基金/证券/期货   \n",
       " 25   https://www.liepin.com/company/2036768/               互联网   \n",
       " 26  https://www.liepin.com/company/13356841/          印刷/包装/造纸   \n",
       " 27                                                    基金/证券/期货   \n",
       " 28                                                    基金/证券/投资   \n",
       " 29                                                    基金/证券/期货   \n",
       " 30  https://www.liepin.com/company/13211309/          运营商/增值服务   \n",
       " 31                                                    房地产租赁/中介   \n",
       " 32   https://www.liepin.com/company/2036768/               互联网   \n",
       " 33   https://www.liepin.com/company/9194127/          基金/证券/期货   \n",
       " 34  https://www.liepin.com/company/13382597/             计算机软件   \n",
       " 35   https://www.liepin.com/company/9689158/          基金/证券/期货   \n",
       " 36   https://www.liepin.com/company/9294742/             检测/认证   \n",
       " 37   https://www.liepin.com/company/8177652/          基金/证券/期货   \n",
       " 38                                                       珠宝/首饰   \n",
       " 39   https://www.liepin.com/company/8932876/              通信设备   \n",
       " \n",
       "    job.pcOuterLink job.h5OuterLink comp.compId  comp.compStage  \n",
       " 0              NaN             NaN         NaN             NaN  \n",
       " 1                                     941676.0             NaN  \n",
       " 2                                    8932876.0             NaN  \n",
       " 3                                    8932876.0             NaN  \n",
       " 4                                    8932876.0             NaN  \n",
       " 5                                    8932876.0             NaN  \n",
       " 6                                    1069385.0             NaN  \n",
       " 7              NaN             NaN         NaN           融资未公开  \n",
       " 8                                   12518769.0             NaN  \n",
       " 9                                    5634845.0             已上市  \n",
       " 10                                   9194127.0             NaN  \n",
       " 11             NaN             NaN         NaN           融资未公开  \n",
       " 12             NaN             NaN         NaN           融资未公开  \n",
       " 13             NaN             NaN         NaN            战略融资  \n",
       " 14             NaN             NaN         NaN           融资未公开  \n",
       " 15             NaN             NaN         NaN             NaN  \n",
       " 16                                  12281677.0             NaN  \n",
       " 17                                   8226823.0            美股上市  \n",
       " 18             NaN             NaN         NaN             NaN  \n",
       " 19                                  12281677.0             NaN  \n",
       " 20                                   8373588.0             NaN  \n",
       " 21             NaN             NaN         NaN             已上市  \n",
       " 22             NaN             NaN         NaN              其他  \n",
       " 23             NaN             NaN         NaN           融资未公开  \n",
       " 24                                   8441886.0             已上市  \n",
       " 25                                   2036768.0            港股上市  \n",
       " 26                                  13356841.0             NaN  \n",
       " 27             NaN             NaN         NaN           融资未公开  \n",
       " 28             NaN             NaN         NaN           融资未公开  \n",
       " 29             NaN             NaN         NaN           融资未公开  \n",
       " 30                                  13211309.0             NaN  \n",
       " 31             NaN             NaN         NaN           融资未公开  \n",
       " 32                                   2036768.0            港股上市  \n",
       " 33                                   9194127.0             NaN  \n",
       " 34                                  13382597.0             NaN  \n",
       " 35                                   9689158.0             NaN  \n",
       " 36                                   9294742.0             NaN  \n",
       " 37                                   8177652.0             NaN  \n",
       " 38             NaN             NaN         NaN           融资未公开  \n",
       " 39                                   8932876.0             NaN  \n",
       " \n",
       " [40 rows x 31 columns],\n",
       "                                            dataParams  \\\n",
       " 0   {\"recruiterName\":\"谢女士\",\"imId\":\"e39bf1a7adbdc68...   \n",
       " 1   {\"recruiterName\":\"刘女士\",\"imId\":\"ca72b99f7e34618...   \n",
       " 2   {\"recruiterName\":\"刘先生\",\"imId\":\"a9c9b2abdc5ef81...   \n",
       " 3   {\"recruiterName\":\"金先生\",\"imId\":\"bd51e80ad9b3299...   \n",
       " 4   {\"recruiterName\":\"陆女士\",\"imId\":\"0c667bfd5866397...   \n",
       " 5   {\"recruiterName\":\"尹女士\",\"imId\":\"65d97f4d17e9d03...   \n",
       " 6   {\"recruiterName\":\"梁女士\",\"imId\":\"4bd7f52f246cb60...   \n",
       " 7   {\"recruiterName\":\"尹女士\",\"imId\":\"65d97f4d17e9d03...   \n",
       " 8   {\"recruiterName\":\"兰女士\",\"imId\":\"563de8146b5c88e...   \n",
       " 9   {\"recruiterName\":\"唐女士\",\"imId\":\"296718bfbfbe047...   \n",
       " 10  {\"recruiterName\":\"尹女士\",\"imId\":\"65d97f4d17e9d03...   \n",
       " 11  {\"recruiterName\":\"郭女士\",\"imId\":\"1fe92b456ed95f8...   \n",
       " 12  {\"recruiterName\":\"张女士\",\"imId\":\"f888fb213363e21...   \n",
       " 13  {\"recruiterName\":\"林女士\",\"imId\":\"48db9ec3c0caa03...   \n",
       " 14  {\"recruiterName\":\"严先生\",\"imId\":\"7386a62c478c822...   \n",
       " 15  {\"recruiterName\":\"王女士\",\"imId\":\"c07e1e29b548168...   \n",
       " 16  {\"recruiterName\":\"Lau Tsz Yan\",\"imId\":\"c16c501...   \n",
       " 17  {\"recruiterName\":\"余女士\",\"imId\":\"55345e65008632f...   \n",
       " 18  {\"recruiterName\":\"严先生\",\"imId\":\"7386a62c478c822...   \n",
       " 19  {\"recruiterName\":\"卢女士\",\"imId\":\"35202df2ec70a60...   \n",
       " 20  {\"recruiterName\":\"张先生\",\"imId\":\"c19a3d02ddef322...   \n",
       " 21  {\"recruiterName\":\"刘先生\",\"imId\":\"682bfec45734845...   \n",
       " 22  {\"recruiterName\":\"孙女士\",\"imId\":\"af41426a1c20aec...   \n",
       " 23  {\"recruiterName\":\"李先生\",\"imId\":\"78f0c56ea510c96...   \n",
       " 24  {\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...   \n",
       " 25  {\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...   \n",
       " 26  {\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...   \n",
       " 27  {\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...   \n",
       " 28  {\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...   \n",
       " \n",
       "                                              dataInfo  \\\n",
       " 0   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 1   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 2   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 3   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 4   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 5   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 6   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 7   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 8   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 9   %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 10  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 11  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 12  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 13  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 14  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 15  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 16  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 17  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 18  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 19  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 20  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 21  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 22  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 23  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 24  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 25  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 26  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 27  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " 28  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       " \n",
       "                                            job.labels job.jobKind  \\\n",
       " 0                           [项目工程师, 香港工作, 土木工程, 结构工程]           1   \n",
       " 1                      [金融产品, 金融行业, 征信行业, 用户研究, 产品规划]           1   \n",
       " 2                                                  []           1   \n",
       " 3                                        [数据产品, 数据挖掘]           2   \n",
       " 4                                                  []           2   \n",
       " 5                                                  []           2   \n",
       " 6                         [质量管理, 风控项目, ASP.NET, .NET]           2   \n",
       " 7                                                  []           2   \n",
       " 8                                            [项目施工管理]           2   \n",
       " 9   [金融产品, 互联网金融, 金融理财/贷款, 金融行业, IT互联网, 批发/零售, 产品设...           2   \n",
       " 10                                                 []           2   \n",
       " 11                                                 []           2   \n",
       " 12                                                 []           2   \n",
       " 13                                                 []           1   \n",
       " 14  [出入库管理, 仓库管理, 订单管理, 库存管理, 库存盘点, 现场管理, 海外仓, 贸易/...           2   \n",
       " 15  [saas, 市场洞察, 客户管理, IT/互联网/软件, 电子/通信/硬件, 团队管理, ...           2   \n",
       " 16             [网络营销, 策划, 市场营销, office, 整合营销, 数据统计分析]           2   \n",
       " 17                                                 []           2   \n",
       " 18  [海外仓, 出入库管理, 库存盘点, 仓库管理, 库存管理, 现场管理, 消费品, 贸易/进...           2   \n",
       " 19   [软件测试, selenium, appium, automation, 自动化, 自动化测试]           2   \n",
       " 20                                              [SQL]           2   \n",
       " 21                                                 []           2   \n",
       " 22                                                 []           1   \n",
       " 23                                             [客户服务]           2   \n",
       " 24                                                 []           1   \n",
       " 25                                               [本科]           6   \n",
       " 26                                   [本科, 功能测试, 软件测试]           6   \n",
       " 27               [本科, 软件测试, 应用测试, 功能测试, iOS, Android]           6   \n",
       " 28                                               [本科]           6   \n",
       " \n",
       "                                         job.title  job.salary   job.dq  \\\n",
       " 0                        90M0116548项目工程师(base 香港）      20-30k       香港   \n",
       " 1                                        产品解决方案专家  30-50k·16薪       香港   \n",
       " 2     （Senior）Category Manager (Global Marketing)    3-5k·15薪       香港   \n",
       " 3                              38518C-【CRA】征信模型设计      12-24k       香港   \n",
       " 4                                      南方东英-固收交易员        薪资面议   香港-中西区   \n",
       " 5                                   业务流程岗(J11204)      15-30k   香港-湾仔区   \n",
       " 6                              石油化工项目-设计工程师（派驻香港）      30-40k   香港-葵青区   \n",
       " 7                                     产品岗(J11203)      15-30k   香港-湾仔区   \n",
       " 8          Project Document Controller at HK Site      10-16k   香港-葵青区   \n",
       " 9                                 蚂蚁集团-产品专家-国际事业群  29-50k·16薪   香港-湾仔区   \n",
       " 10                                    产品岗(J11146)      25-30k   香港-湾仔区   \n",
       " 11                 Associate, Product Development  20-35k·15薪   香港-中西区   \n",
       " 12                                Account Manager      40-70k    香港-东区   \n",
       " 13                     高级ICT技术经理 （云网，安全，大数据等技术方向)  40-60k·13薪  香港-九龙城区   \n",
       " 14                                           仓库文员  14-18k·13薪   香港-元朗区   \n",
       " 15                                         商务开发经理  15-30k·14薪   香港-沙田区   \n",
       " 16           Assistant Manager, Digital Marketing      32-37k  香港-油尖旺区   \n",
       " 17                             IT Project Manager      30-60k   香港-湾仔区   \n",
       " 18                                           仓库组长  13-18k·13薪   香港-元朗区   \n",
       " 19                                        QA测试工程师      30-35k  香港-深水埗区   \n",
       " 20                    Senior Program Manager - HK      40-70k       香港   \n",
       " 21                                     9号牌RO（负责人）      45-55k       香港   \n",
       " 22                                   证券投资经理（产品策略）     70-100k   香港-中西区   \n",
       " 23       客户服务经理Product & Customer Service Manager        薪资面议   香港-中西区   \n",
       " 24                               风险合规经理（离岸财富管理产品）  40-70k·18薪       香港   \n",
       " 25                                           产品经理      12-25k   香港-湾仔区   \n",
       " 26                                   软件测试应届生（23届）      20-25k       香港   \n",
       " 27                                       APP测试工程师      20-25k    香港-东区   \n",
       " 28  Graduate Engineer (Civil and MEP Engineering)      20-21k  香港-油尖旺区   \n",
       " \n",
       "    job.refreshTime job.jobId  \\\n",
       " 0   20230510114027  45988881   \n",
       " 1   20230512101034  45314055   \n",
       " 2   20230512180619  46084381   \n",
       " 3   20221019114143  52877713   \n",
       " 4   20230421094845  55377327   \n",
       " 5   20230528225940  55518261   \n",
       " 6   20230307110649  52236989   \n",
       " 7   20230314175648  55518217   \n",
       " 8   20230505151345  52324805   \n",
       " 9   20220627182122  50701623   \n",
       " 10  20230314175658  54850547   \n",
       " 11  20220830181022  52269147   \n",
       " 12  20230607112011  58635435   \n",
       " 13  20230320181620  44567933   \n",
       " 14  20221130092435  52839935   \n",
       " 15  20220916172601  52515213   \n",
       " 16  20210407193222  37908187   \n",
       " 17  20210813101005  42097463   \n",
       " 18  20221130092445  52841325   \n",
       " 19  20210414103726  37756355   \n",
       " 20  20230613145827  59294969   \n",
       " 21  20220104124215  46141861   \n",
       " 22  20230512111449  45991121   \n",
       " 23  20230515110246  52796263   \n",
       " 24  20230522113042  46316869   \n",
       " 25  20210223134718  36105889   \n",
       " 26  20230613110233  59283885   \n",
       " 27  20230506100220  58318215   \n",
       " 28  20230614100413  57158615   \n",
       " \n",
       "                                        job.dataPromId  ...  comp.compStage  \\\n",
       " 0   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...           不需要融资   \n",
       " 1   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...           融资未公开   \n",
       " 2   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...           融资未公开   \n",
       " 3   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...            美股上市   \n",
       " 4   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 5   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             已上市   \n",
       " 6   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 7   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             已上市   \n",
       " 8   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 9   d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...              B轮   \n",
       " 10  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             已上市   \n",
       " 11  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 12  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 13  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 14  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...              其他   \n",
       " 15  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 16  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 17  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 18  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...              其他   \n",
       " 19  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 20  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 21  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 22  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 23  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 24  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...           融资未公开   \n",
       " 25  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 26  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...           融资未公开   \n",
       " 27  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " 28  d_sfrom=search_prime&d_ckId=null&d_curPage=2&d...  ...             NaN   \n",
       " \n",
       "                       comp.compLogo  comp.compScale     comp.compName  \\\n",
       " 0   60e2fe0bf3df194a3c48adb502u.png        10000人以上             某知名公司   \n",
       " 1   60e2fe0bf3df194a3c48adb502u.png     5000-10000人        某深圳大型互联网公司   \n",
       " 2   60e2fe0bf3df194a3c48adb502u.png        100-499人       某上海人力资源服务公司   \n",
       " 3   5f3ca396ea60860b75020faa02u.jpg      2000-5000人             金融壹账通   \n",
       " 4   60e54741e2df5862a08674ba03u.png        500-999人      南方基金管理股份有限公司   \n",
       " 5   6401a2dfeab4507021d30bd003u.png     5000-10000人              光大证券   \n",
       " 6   59a3d5bf70325ec22ee5823006a.jpg     5000-10000人              必维集团   \n",
       " 7   6401a2dfeab4507021d30bd003u.png     5000-10000人              光大证券   \n",
       " 8   5f07d063543a971969eb6ddc04u.jpg        10000人以上      上海协同工程咨询有限公司   \n",
       " 9   62567089cff8571d7c28d47c03u.png     5000-10000人              蚂蚁集团   \n",
       " 10  6401a2dfeab4507021d30bd003u.png     5000-10000人              光大证券   \n",
       " 11  61b07937d0458d53c627567e02u.jpg           1-49人     港交所(深圳)控股有限公司   \n",
       " 12  63d4d7f3334c74039df34ccc07u.png                  深圳前海捷创未来技术服务有限公司   \n",
       " 13  60e2fe0bf3df194a3c48adb502u.png        500-999人         某大型通信设备公司   \n",
       " 14  5e0d529f6324626e1789ab2807u.png     5000-10000人      上海识装信息科技有限公司   \n",
       " 15  61b07937d0458d53c627567e02u.jpg          50-99人        耀通科技投资有限公司   \n",
       " 16  596703ff703287e466d532bd05a.jpg        10000人以上               优衣库   \n",
       " 17  64644efa870d6b1f1bd7c75708u.png        100-499人    安山国际控股(广东)有限公司   \n",
       " 18  5e0d529f6324626e1789ab2807u.png     5000-10000人      上海识装信息科技有限公司   \n",
       " 19  61b07937d0458d53c627567e02u.jpg                          分子金融有限公司   \n",
       " 20  5a28acf07032d5b4c547580d04a.jpg     5000-10000人               亚马逊   \n",
       " 21  61b07937d0458d53c627567e02u.jpg           1-49人    苏州奥普雷斯资产管理有限公司   \n",
       " 22  60e2fe0bf3df194a3c48adb502u.png          50-99人               某公司   \n",
       " 23  59b1f9eb70325ec22eea93a305a.jpg        500-999人              嘉实财富   \n",
       " 24  60e2fe0bf3df194a3c48adb502u.png        500-999人        某公募基金理财子公司   \n",
       " 25  616f846645a2627dc008eaa008u.png      2000-5000人        华润数科控股有限公司   \n",
       " 26  62b3ce0c8cd3bf59a05ff51d04u.png        100-499人      成都无敌勇士科技有限公司   \n",
       " 27  61b07937d0458d53c627567e02u.jpg                     Winner Studio   \n",
       " 28  5cd93b94501544662c710a6c05u.png        100-499人              阿特金斯   \n",
       " \n",
       "    comp.compIndustry                                 comp.link  \\\n",
       " 0             人力资源服务                                             \n",
       " 1                互联网                                             \n",
       " 2             人力资源服务                                             \n",
       " 3               科技金融   https://www.liepin.com/company/8226823/   \n",
       " 4           基金/证券/期货   https://www.liepin.com/company/9689158/   \n",
       " 5           基金/证券/期货   https://www.liepin.com/company/8441886/   \n",
       " 6              检测/认证   https://www.liepin.com/company/9294742/   \n",
       " 7           基金/证券/期货   https://www.liepin.com/company/8441886/   \n",
       " 8         工程管理/勘察/监理  https://www.liepin.com/company/12281677/   \n",
       " 9               科技金融   https://www.liepin.com/company/8968236/   \n",
       " 10          基金/证券/期货   https://www.liepin.com/company/8441886/   \n",
       " 11          财务/审计/税务  https://www.liepin.com/company/12399159/   \n",
       " 12             计算机软件  https://www.liepin.com/company/13382597/   \n",
       " 13              通信设备                                             \n",
       " 14               互联网   https://www.liepin.com/company/9698935/   \n",
       " 15             计算机软件  https://www.liepin.com/company/13311913/   \n",
       " 16          服装/纺织/皮革   https://www.liepin.com/company/5279887/   \n",
       " 17          基金/证券/期货  https://www.liepin.com/company/10035863/   \n",
       " 18               互联网   https://www.liepin.com/company/9698935/   \n",
       " 19              IT服务  https://www.liepin.com/company/12664927/   \n",
       " 20               互联网   https://www.liepin.com/company/8642300/   \n",
       " 21          基金/证券/期货  https://www.liepin.com/company/12979213/   \n",
       " 22              咨询服务                                             \n",
       " 23          基金/证券/期货   https://www.liepin.com/company/8437694/   \n",
       " 24          基金/证券/投资                                             \n",
       " 25              人工智能  https://www.liepin.com/company/12208295/   \n",
       " 26                游戏   https://www.liepin.com/company/9861675/   \n",
       " 27                游戏  https://www.liepin.com/company/13447701/   \n",
       " 28           房地产开发经营   https://www.liepin.com/company/2680101/   \n",
       " \n",
       "    job.pcOuterLink job.h5OuterLink comp.compId  job.campusJobKind  \n",
       " 0              NaN             NaN         NaN                NaN  \n",
       " 1              NaN             NaN         NaN                NaN  \n",
       " 2              NaN             NaN         NaN                NaN  \n",
       " 3                                    8226823.0                NaN  \n",
       " 4                                    9689158.0                NaN  \n",
       " 5                                    8441886.0                NaN  \n",
       " 6                                    9294742.0                NaN  \n",
       " 7                                    8441886.0                NaN  \n",
       " 8                                   12281677.0                NaN  \n",
       " 9                                    8968236.0                NaN  \n",
       " 10                                   8441886.0                NaN  \n",
       " 11                                  12399159.0                NaN  \n",
       " 12                                  13382597.0                NaN  \n",
       " 13             NaN             NaN         NaN                NaN  \n",
       " 14                                   9698935.0                NaN  \n",
       " 15                                  13311913.0                NaN  \n",
       " 16                                   5279887.0                NaN  \n",
       " 17                                  10035863.0                NaN  \n",
       " 18                                   9698935.0                NaN  \n",
       " 19                                  12664927.0                NaN  \n",
       " 20                                   8642300.0                NaN  \n",
       " 21                                  12979213.0                NaN  \n",
       " 22             NaN             NaN         NaN                NaN  \n",
       " 23                                   8437694.0                NaN  \n",
       " 24             NaN             NaN         NaN                NaN  \n",
       " 25                                  12208295.0                 应届  \n",
       " 26                                   9861675.0                 应届  \n",
       " 27                                  13447701.0                 应届  \n",
       " 28                                   2680101.0                 应届  \n",
       " \n",
       " [29 rows x 32 columns]]"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "response_df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "execution": {
     "iopub.status.busy": "2023-05-31T12:46:29.792246Z",
     "iopub.status.idle": "2023-05-31T12:46:29.792555Z",
     "shell.execute_reply": "2023-05-31T12:46:29.792418Z",
     "shell.execute_reply.started": "2023-05-31T12:46:29.792405Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Flatten the job-card records of one API response into a DataFrame.\n",
    "# json_normalize joins nested keys with '.' by default.\n",
    "# Assumes `response_data` is the parsed JSON response built in an earlier cell -- TODO confirm.\n",
    "pd.json_normalize(\n",
    "    data=response_data['data']['data']['jobCardList'],\n",
    ")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 数据整理成为表格\n",
    "> 1. 使用 pandas 的 `concat` 方法，把多个 DataFrame 合并成一张表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:00:36.613427Z",
     "iopub.status.busy": "2023-06-14T09:00:36.611950Z",
     "iopub.status.idle": "2023-06-14T09:00:36.678792Z",
     "shell.execute_reply": "2023-06-14T09:00:36.677596Z",
     "shell.execute_reply.started": "2023-06-14T09:00:36.613371Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>job.jobId</th>\n",
       "      <th>job.jobKind</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>...</th>\n",
       "      <th>recruiter.recruiterTitle</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>job.campusJobKind</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...</td>\n",
       "      <td>[金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20221118143443</td>\n",
       "      <td>51880109</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>人力资源经理/主管</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>8226823.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>金融壹账通</td>\n",
       "      <td>美股上市</td>\n",
       "      <td>5f3ca396ea60860b75020faa02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/8226823/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>[IT互联网, SaaS产品, to B, 产品设计, 移动端产品]</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720383</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720027</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...</td>\n",
       "      <td>[交易产品, 金融行业]</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20221230112638</td>\n",
       "      <td>55273999</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>4580900.0</td>\n",
       "      <td>5000-10000人</td>\n",
       "      <td>中国国际金融股份有限公司</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>5bcd8a2f8e50a3257f7102c304a.jpg</td>\n",
       "      <td>https://www.liepin.com/company/4580900/</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20220810153828</td>\n",
       "      <td>51789749</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Sourcer</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>1069385.0</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>伊顿中国</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5bfe9df574719d2aa34b7b2203a.png</td>\n",
       "      <td>https://www.liepin.com/company/1069385/</td>\n",
       "      <td>机械/设备</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>46316869</td>\n",
       "      <td>1</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>5a95fa858e50c5b3522c209306a.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td></td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...</td>\n",
       "      <td>[本科]</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>36105889</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>12208295.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>616f846645a2627dc008eaa008u.png</td>\n",
       "      <td>https://www.liepin.com/company/12208295/</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...</td>\n",
       "      <td>[本科, 功能测试, 软件测试]</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>59283885</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>HR</td>\n",
       "      <td>63a26c44dab8425fae0e7e1b03u.png</td>\n",
       "      <td>9861675.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>62b3ce0c8cd3bf59a05ff51d04u.png</td>\n",
       "      <td>https://www.liepin.com/company/9861675/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...</td>\n",
       "      <td>[本科, 软件测试, 应用测试, 功能测试, iOS, Android]</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>58318215</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f986779c7cc70efbf36c008u.jpg</td>\n",
       "      <td>13447701.0</td>\n",
       "      <td></td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13447701/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...</td>\n",
       "      <td>[本科]</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>57158615</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>senior recruiter</td>\n",
       "      <td>5f8f98648dbe6273dcf8515508u.jpg</td>\n",
       "      <td>2680101.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5cd93b94501544662c710a6c05u.png</td>\n",
       "      <td>https://www.liepin.com/company/2680101/</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>109 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             dataInfo  \\\n",
       "0   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "1   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "2   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "3   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "4   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "..                                                ...   \n",
       "24  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "25  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "26  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "27  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "28  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "\n",
       "                                           dataParams  \\\n",
       "0   {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       "1   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "2   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "3   {\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...   \n",
       "4   {\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...   \n",
       "..                                                ...   \n",
       "24  {\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...   \n",
       "25  {\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...   \n",
       "26  {\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...   \n",
       "27  {\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...   \n",
       "28  {\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...   \n",
       "\n",
       "                                           job.labels  job.salary   job.dq  \\\n",
       "0   [金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...        薪资面议   香港-观塘区   \n",
       "1                  [IT互联网, SaaS产品, to B, 产品设计, 移动端产品]      25-40k   香港-观塘区   \n",
       "2                                                  []      40-60k   香港-观塘区   \n",
       "3                                        [交易产品, 金融行业]        薪资面议   香港-中西区   \n",
       "4                                                  []        薪资面议    香港-东区   \n",
       "..                                                ...         ...      ...   \n",
       "24                                                 []  40-70k·18薪       香港   \n",
       "25                                               [本科]      12-25k   香港-湾仔区   \n",
       "26                                   [本科, 功能测试, 软件测试]      20-25k       香港   \n",
       "27               [本科, 软件测试, 应用测试, 功能测试, iOS, Android]      20-25k    香港-东区   \n",
       "28                                               [本科]      20-21k  香港-油尖旺区   \n",
       "\n",
       "   job.requireWorkYears job.refreshTime job.jobId job.jobKind  job.topJob  \\\n",
       "0                  3-5年  20221118143443  51880109           2       False   \n",
       "1                 5-10年  20230602174402  58720383           2       False   \n",
       "2                  3-5年  20230602174402  58720027           2       False   \n",
       "3                 5-10年  20221230112638  55273999           2       False   \n",
       "4                 10年以上  20220810153828  51789749           2       False   \n",
       "..                  ...             ...       ...         ...         ...   \n",
       "24                5-10年  20230522113042  46316869           1       False   \n",
       "25                  NaN  20210223134718  36105889           6       False   \n",
       "26                  NaN  20230613110233  59283885           6       False   \n",
       "27                  NaN  20230506100220  58318215           6       False   \n",
       "28                  NaN  20230614100413  57158615           6       False   \n",
       "\n",
       "    ...    recruiter.recruiterTitle         recruiter.recruiterPhoto  \\\n",
       "0   ...                   人力资源经理/主管  5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "1   ...  Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png   \n",
       "2   ...  Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png   \n",
       "3   ...                              5f8f9865ea60860b75384fa508u.jpg   \n",
       "4   ...                     Sourcer  5f8f9865ea60860b75384fa508u.jpg   \n",
       "..  ...                         ...                              ...   \n",
       "24  ...                        猎头顾问  5a95fa858e50c5b3522c209306a.png   \n",
       "25  ...                              5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "26  ...                          HR  63a26c44dab8425fae0e7e1b03u.png   \n",
       "27  ...                              5f8f986779c7cc70efbf36c008u.jpg   \n",
       "28  ...            senior recruiter  5f8f98648dbe6273dcf8515508u.jpg   \n",
       "\n",
       "   comp.compId comp.compScale                  comp.compName comp.compStage  \\\n",
       "0    8226823.0     2000-5000人                          金融壹账通           美股上市   \n",
       "1   13057723.0         50-99人  KPay merchant service limited            NaN   \n",
       "2   13057723.0         50-99人  KPay merchant service limited            NaN   \n",
       "3    4580900.0    5000-10000人                   中国国际金融股份有限公司         沪深A股上市   \n",
       "4    1069385.0       10000人以上                           伊顿中国            NaN   \n",
       "..         ...            ...                            ...            ...   \n",
       "24         NaN       500-999人                     某公募基金理财子公司          融资未公开   \n",
       "25  12208295.0     2000-5000人                     华润数科控股有限公司            NaN   \n",
       "26   9861675.0       100-499人                   成都无敌勇士科技有限公司          融资未公开   \n",
       "27  13447701.0                                 Winner Studio            NaN   \n",
       "28   2680101.0       100-499人                           阿特金斯            NaN   \n",
       "\n",
       "                      comp.compLogo                                 comp.link  \\\n",
       "0   5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       "1   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       "2   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       "3   5bcd8a2f8e50a3257f7102c304a.jpg   https://www.liepin.com/company/4580900/   \n",
       "4   5bfe9df574719d2aa34b7b2203a.png   https://www.liepin.com/company/1069385/   \n",
       "..                              ...                                       ...   \n",
       "24  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       "25  616f846645a2627dc008eaa008u.png  https://www.liepin.com/company/12208295/   \n",
       "26  62b3ce0c8cd3bf59a05ff51d04u.png   https://www.liepin.com/company/9861675/   \n",
       "27  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13447701/   \n",
       "28  5cd93b94501544662c710a6c05u.png   https://www.liepin.com/company/2680101/   \n",
       "\n",
       "   comp.compIndustry job.campusJobKind  \n",
       "0               科技金融               NaN  \n",
       "1               科技金融               NaN  \n",
       "2               科技金融               NaN  \n",
       "3           基金/证券/期货               NaN  \n",
       "4              机械/设备               NaN  \n",
       "..               ...               ...  \n",
       "24          基金/证券/投资               NaN  \n",
       "25              人工智能                应届  \n",
       "26                游戏                应届  \n",
       "27                游戏                应届  \n",
       "28           房地产开发经营                应届  \n",
       "\n",
       "[109 rows x 32 columns]"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Combine the frames collected in response_df into a single table.\n",
    "# Without ignore_index=True every input frame keeps its own row labels, so the\n",
    "# result has repeated labels (the stored output showed 109 rows ending at label 28);\n",
    "# renumbering 0..N-1 keeps label-based lookups and the exported index unambiguous.\n",
    "df = pd.concat(response_df, ignore_index=True)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:00:40.413373Z",
     "iopub.status.busy": "2023-06-14T09:00:40.412420Z",
     "iopub.status.idle": "2023-06-14T09:00:40.646794Z",
     "shell.execute_reply": "2023-06-14T09:00:40.645798Z",
     "shell.execute_reply.started": "2023-06-14T09:00:40.413324Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "# Write the combined table to an Excel workbook in the current working directory.\n",
    "df.to_excel(excel_writer='liepin_PM_0510.xlsx')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 数据整理成为表格\n",
    "> 1. pandas 中的 concat 方法"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:02:37.648161Z",
     "iopub.status.busy": "2023-06-14T09:02:37.646927Z",
     "iopub.status.idle": "2023-06-14T09:02:37.696190Z",
     "shell.execute_reply": "2023-06-14T09:02:37.695300Z",
     "shell.execute_reply.started": "2023-06-14T09:02:37.648120Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>job.jobId</th>\n",
       "      <th>job.jobKind</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>...</th>\n",
       "      <th>recruiter.recruiterTitle</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>job.campusJobKind</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...</td>\n",
       "      <td>[金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20221118143443</td>\n",
       "      <td>51880109</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>人力资源经理/主管</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>8226823.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>金融壹账通</td>\n",
       "      <td>美股上市</td>\n",
       "      <td>5f3ca396ea60860b75020faa02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/8226823/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>[IT互联网, SaaS产品, to B, 产品设计, 移动端产品]</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720383</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720027</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...</td>\n",
       "      <td>[交易产品, 金融行业]</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20221230112638</td>\n",
       "      <td>55273999</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>4580900.0</td>\n",
       "      <td>5000-10000人</td>\n",
       "      <td>中国国际金融股份有限公司</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>5bcd8a2f8e50a3257f7102c304a.jpg</td>\n",
       "      <td>https://www.liepin.com/company/4580900/</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20220810153828</td>\n",
       "      <td>51789749</td>\n",
       "      <td>2</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>Sourcer</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>1069385.0</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>伊顿中国</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5bfe9df574719d2aa34b7b2203a.png</td>\n",
       "      <td>https://www.liepin.com/company/1069385/</td>\n",
       "      <td>机械/设备</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>46316869</td>\n",
       "      <td>1</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>5a95fa858e50c5b3522c209306a.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td></td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...</td>\n",
       "      <td>[本科]</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>36105889</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>12208295.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>616f846645a2627dc008eaa008u.png</td>\n",
       "      <td>https://www.liepin.com/company/12208295/</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...</td>\n",
       "      <td>[本科, 功能测试, 软件测试]</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>59283885</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>HR</td>\n",
       "      <td>63a26c44dab8425fae0e7e1b03u.png</td>\n",
       "      <td>9861675.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>62b3ce0c8cd3bf59a05ff51d04u.png</td>\n",
       "      <td>https://www.liepin.com/company/9861675/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...</td>\n",
       "      <td>[本科, 软件测试, 应用测试, 功能测试, iOS, Android]</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>58318215</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td></td>\n",
       "      <td>5f8f986779c7cc70efbf36c008u.jpg</td>\n",
       "      <td>13447701.0</td>\n",
       "      <td></td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13447701/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...</td>\n",
       "      <td>[本科]</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>57158615</td>\n",
       "      <td>6</td>\n",
       "      <td>False</td>\n",
       "      <td>...</td>\n",
       "      <td>senior recruiter</td>\n",
       "      <td>5f8f98648dbe6273dcf8515508u.jpg</td>\n",
       "      <td>2680101.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5cd93b94501544662c710a6c05u.png</td>\n",
       "      <td>https://www.liepin.com/company/2680101/</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>109 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             dataInfo  \\\n",
       "0   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "1   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "2   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "3   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "4   %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "..                                                ...   \n",
       "24  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "25  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "26  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "27  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "28  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "\n",
       "                                           dataParams  \\\n",
       "0   {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       "1   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "2   {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "3   {\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...   \n",
       "4   {\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...   \n",
       "..                                                ...   \n",
       "24  {\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...   \n",
       "25  {\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...   \n",
       "26  {\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...   \n",
       "27  {\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...   \n",
       "28  {\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...   \n",
       "\n",
       "                                           job.labels  job.salary   job.dq  \\\n",
       "0   [金融产品, 征信行业, 金融行业, 金融理财/贷款, 批发/零售, 产品优化, 产品设计,...        薪资面议   香港-观塘区   \n",
       "1                  [IT互联网, SaaS产品, to B, 产品设计, 移动端产品]      25-40k   香港-观塘区   \n",
       "2                                                  []      40-60k   香港-观塘区   \n",
       "3                                        [交易产品, 金融行业]        薪资面议   香港-中西区   \n",
       "4                                                  []        薪资面议    香港-东区   \n",
       "..                                                ...         ...      ...   \n",
       "24                                                 []  40-70k·18薪       香港   \n",
       "25                                               [本科]      12-25k   香港-湾仔区   \n",
       "26                                   [本科, 功能测试, 软件测试]      20-25k       香港   \n",
       "27               [本科, 软件测试, 应用测试, 功能测试, iOS, Android]      20-25k    香港-东区   \n",
       "28                                               [本科]      20-21k  香港-油尖旺区   \n",
       "\n",
       "   job.requireWorkYears job.refreshTime job.jobId job.jobKind  job.topJob  \\\n",
       "0                  3-5年  20221118143443  51880109           2       False   \n",
       "1                 5-10年  20230602174402  58720383           2       False   \n",
       "2                  3-5年  20230602174402  58720027           2       False   \n",
       "3                 5-10年  20221230112638  55273999           2       False   \n",
       "4                 10年以上  20220810153828  51789749           2       False   \n",
       "..                  ...             ...       ...         ...         ...   \n",
       "24                5-10年  20230522113042  46316869           1       False   \n",
       "25                  NaN  20210223134718  36105889           6       False   \n",
       "26                  NaN  20230613110233  59283885           6       False   \n",
       "27                  NaN  20230506100220  58318215           6       False   \n",
       "28                  NaN  20230614100413  57158615           6       False   \n",
       "\n",
       "    ...    recruiter.recruiterTitle         recruiter.recruiterPhoto  \\\n",
       "0   ...                   人力资源经理/主管  5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "1   ...  Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png   \n",
       "2   ...  Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png   \n",
       "3   ...                              5f8f9865ea60860b75384fa508u.jpg   \n",
       "4   ...                     Sourcer  5f8f9865ea60860b75384fa508u.jpg   \n",
       "..  ...                         ...                              ...   \n",
       "24  ...                        猎头顾问  5a95fa858e50c5b3522c209306a.png   \n",
       "25  ...                              5f8f9866dfb13a7dee342f1808u.jpg   \n",
       "26  ...                          HR  63a26c44dab8425fae0e7e1b03u.png   \n",
       "27  ...                              5f8f986779c7cc70efbf36c008u.jpg   \n",
       "28  ...            senior recruiter  5f8f98648dbe6273dcf8515508u.jpg   \n",
       "\n",
       "   comp.compId comp.compScale                  comp.compName comp.compStage  \\\n",
       "0    8226823.0     2000-5000人                          金融壹账通           美股上市   \n",
       "1   13057723.0         50-99人  KPay merchant service limited            NaN   \n",
       "2   13057723.0         50-99人  KPay merchant service limited            NaN   \n",
       "3    4580900.0    5000-10000人                   中国国际金融股份有限公司         沪深A股上市   \n",
       "4    1069385.0       10000人以上                           伊顿中国            NaN   \n",
       "..         ...            ...                            ...            ...   \n",
       "24         NaN       500-999人                     某公募基金理财子公司          融资未公开   \n",
       "25  12208295.0     2000-5000人                     华润数科控股有限公司            NaN   \n",
       "26   9861675.0       100-499人                   成都无敌勇士科技有限公司          融资未公开   \n",
       "27  13447701.0                                 Winner Studio            NaN   \n",
       "28   2680101.0       100-499人                           阿特金斯            NaN   \n",
       "\n",
       "                      comp.compLogo                                 comp.link  \\\n",
       "0   5f3ca396ea60860b75020faa02u.jpg   https://www.liepin.com/company/8226823/   \n",
       "1   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       "2   61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13057723/   \n",
       "3   5bcd8a2f8e50a3257f7102c304a.jpg   https://www.liepin.com/company/4580900/   \n",
       "4   5bfe9df574719d2aa34b7b2203a.png   https://www.liepin.com/company/1069385/   \n",
       "..                              ...                                       ...   \n",
       "24  60e2fe0bf3df194a3c48adb502u.png                                             \n",
       "25  616f846645a2627dc008eaa008u.png  https://www.liepin.com/company/12208295/   \n",
       "26  62b3ce0c8cd3bf59a05ff51d04u.png   https://www.liepin.com/company/9861675/   \n",
       "27  61b07937d0458d53c627567e02u.jpg  https://www.liepin.com/company/13447701/   \n",
       "28  5cd93b94501544662c710a6c05u.png   https://www.liepin.com/company/2680101/   \n",
       "\n",
       "   comp.compIndustry job.campusJobKind  \n",
       "0               科技金融               NaN  \n",
       "1               科技金融               NaN  \n",
       "2               科技金融               NaN  \n",
       "3           基金/证券/期货               NaN  \n",
       "4              机械/设备               NaN  \n",
       "..               ...               ...  \n",
       "24          基金/证券/投资               NaN  \n",
       "25              人工智能                应届  \n",
       "26                游戏                应届  \n",
       "27                游戏                应届  \n",
       "28           房地产开发经营                应届  \n",
       "\n",
       "[109 rows x 32 columns]"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.concat(response_df)\r\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:03:00.420370Z",
     "iopub.status.busy": "2023-06-14T09:03:00.419741Z",
     "iopub.status.idle": "2023-06-14T09:03:00.426357Z",
     "shell.execute_reply": "2023-06-14T09:03:00.425457Z",
     "shell.execute_reply.started": "2023-06-14T09:03:00.420335Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'产品经理'"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "key = payload['data']['mainSearchPcConditionForm']['key']\r\n",
    "key"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 数据存储"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:03:36.545799Z",
     "iopub.status.busy": "2023-06-14T09:03:36.545230Z",
     "iopub.status.idle": "2023-06-14T09:03:36.549687Z",
     "shell.execute_reply": "2023-06-14T09:03:36.548875Z",
     "shell.execute_reply.started": "2023-06-14T09:03:36.545763Z"
    },
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "import time"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:03:50.929188Z",
     "iopub.status.busy": "2023-06-14T09:03:50.927869Z",
     "iopub.status.idle": "2023-06-14T09:03:50.935071Z",
     "shell.execute_reply": "2023-06-14T09:03:50.934033Z",
     "shell.execute_reply.started": "2023-06-14T09:03:50.929140Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "time.struct_time(tm_year=2023, tm_mon=6, tm_mday=14, tm_hour=17, tm_min=3, tm_sec=50, tm_wday=2, tm_yday=165, tm_isdst=0)"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "time.localtime()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:04:06.724484Z",
     "iopub.status.busy": "2023-06-14T09:04:06.723916Z",
     "iopub.status.idle": "2023-06-14T09:04:06.730848Z",
     "shell.execute_reply": "2023-06-14T09:04:06.730032Z",
     "shell.execute_reply.started": "2023-06-14T09:04:06.724451Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'614_174'"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "output_time = str(time.localtime().tm_mon)\\\r\n",
    "             +str(time.localtime().tm_mday)+'_'\\\r\n",
    "             +str(time.localtime().tm_hour) \\\r\n",
    "             +str(time.localtime().tm_min)\r\n",
    "output_time "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:04:23.047319Z",
     "iopub.status.busy": "2023-06-14T09:04:23.046735Z",
     "iopub.status.idle": "2023-06-14T09:04:23.225878Z",
     "shell.execute_reply": "2023-06-14T09:04:23.224646Z",
     "shell.execute_reply.started": "2023-06-14T09:04:23.047281Z"
    },
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "# 按照职位名称和时间导出文件\r\n",
    "df.to_excel( key +'_liepin_'+output_time+'.xlsx')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 数据分析\n",
    "\n",
    "> 1. Pandas/Numpy\n",
    "> 2. Pyecharts(bokeh、matplotlib、seaborn、echarts、Tableau)/更考虑用户的体验"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:05:04.411956Z",
     "iopub.status.busy": "2023-06-14T09:05:04.411332Z",
     "iopub.status.idle": "2023-06-14T09:05:04.416077Z",
     "shell.execute_reply": "2023-06-14T09:05:04.415205Z",
     "shell.execute_reply.started": "2023-06-14T09:05:04.411923Z"
    },
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:05:14.506810Z",
     "iopub.status.busy": "2023-06-14T09:05:14.506092Z",
     "iopub.status.idle": "2023-06-14T09:05:14.601364Z",
     "shell.execute_reply": "2023-06-14T09:05:14.600444Z",
     "shell.execute_reply.started": "2023-06-14T09:05:14.506764Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>job.jobId</th>\n",
       "      <th>job.jobKind</th>\n",
       "      <th>...</th>\n",
       "      <th>recruiter.recruiterTitle</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>job.campusJobKind</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...</td>\n",
       "      <td>['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20221118143443</td>\n",
       "      <td>51880109</td>\n",
       "      <td>2</td>\n",
       "      <td>...</td>\n",
       "      <td>人力资源经理/主管</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>8226823.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>金融壹账通</td>\n",
       "      <td>美股上市</td>\n",
       "      <td>5f3ca396ea60860b75020faa02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/8226823/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720383</td>\n",
       "      <td>2</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>58720027</td>\n",
       "      <td>2</td>\n",
       "      <td>...</td>\n",
       "      <td>Talent Acquisition Manager</td>\n",
       "      <td>61e1521019ffac3de11dd5c403u.png</td>\n",
       "      <td>13057723.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13057723/</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...</td>\n",
       "      <td>['交易产品', '金融行业']</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20221230112638</td>\n",
       "      <td>55273999</td>\n",
       "      <td>2</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>4580900.0</td>\n",
       "      <td>5000-10000人</td>\n",
       "      <td>中国国际金融股份有限公司</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>5bcd8a2f8e50a3257f7102c304a.jpg</td>\n",
       "      <td>https://www.liepin.com/company/4580900/</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...</td>\n",
       "      <td>[]</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>20220810153828</td>\n",
       "      <td>51789749</td>\n",
       "      <td>2</td>\n",
       "      <td>...</td>\n",
       "      <td>Sourcer</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>1069385.0</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>伊顿中国</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5bfe9df574719d2aa34b7b2203a.png</td>\n",
       "      <td>https://www.liepin.com/company/1069385/</td>\n",
       "      <td>机械/设备</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>104</th>\n",
       "      <td>24</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...</td>\n",
       "      <td>[]</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>46316869</td>\n",
       "      <td>1</td>\n",
       "      <td>...</td>\n",
       "      <td>猎头顾问</td>\n",
       "      <td>5a95fa858e50c5b3522c209306a.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>NaN</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>25</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>36105889</td>\n",
       "      <td>6</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>12208295.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>616f846645a2627dc008eaa008u.png</td>\n",
       "      <td>https://www.liepin.com/company/12208295/</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106</th>\n",
       "      <td>26</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...</td>\n",
       "      <td>['本科', '功能测试', '软件测试']</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>59283885</td>\n",
       "      <td>6</td>\n",
       "      <td>...</td>\n",
       "      <td>HR</td>\n",
       "      <td>63a26c44dab8425fae0e7e1b03u.png</td>\n",
       "      <td>9861675.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>62b3ce0c8cd3bf59a05ff51d04u.png</td>\n",
       "      <td>https://www.liepin.com/company/9861675/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>107</th>\n",
       "      <td>27</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...</td>\n",
       "      <td>['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>58318215</td>\n",
       "      <td>6</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5f8f986779c7cc70efbf36c008u.jpg</td>\n",
       "      <td>13447701.0</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>NaN</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>https://www.liepin.com/company/13447701/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <td>28</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>57158615</td>\n",
       "      <td>6</td>\n",
       "      <td>...</td>\n",
       "      <td>senior recruiter</td>\n",
       "      <td>5f8f98648dbe6273dcf8515508u.jpg</td>\n",
       "      <td>2680101.0</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>NaN</td>\n",
       "      <td>5cd93b94501544662c710a6c05u.png</td>\n",
       "      <td>https://www.liepin.com/company/2680101/</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>应届</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>109 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                           dataInfo  \\\n",
       "0             0  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "1             1  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "2             2  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "3             3  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "4             4  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "..          ...                                                ...   \n",
       "104          24  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "105          25  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "106          26  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "107          27  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "108          28  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "\n",
       "                                            dataParams  \\\n",
       "0    {\"userId\":\"07bc072f44dc45b06882c0069b0a733a\",\"...   \n",
       "1    {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "2    {\"userId\":\"3893707b7534cc7459557d9eb7993d2f\",\"...   \n",
       "3    {\"userId\":\"1efac136cbe60a32a3ebc0e282cc3953\",\"...   \n",
       "4    {\"userId\":\"8aca73f4bae4fc17102021541d30443c\",\"...   \n",
       "..                                                 ...   \n",
       "104  {\"recruiterName\":\"张先生\",\"imId\":\"4957d4f10187b67...   \n",
       "105  {\"recruiterName\":\"林女士\",\"imId\":\"e0944bb808b7f30...   \n",
       "106  {\"recruiterName\":\"陈女士\",\"imId\":\"391cce9e9c117e5...   \n",
       "107  {\"recruiterName\":\"张女士\",\"imId\":\"1f106856e3e5293...   \n",
       "108  {\"recruiterName\":\"石女士\",\"imId\":\"1b3d0b15ea2bc13...   \n",
       "\n",
       "                                            job.labels  job.salary   job.dq  \\\n",
       "0    ['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...        薪资面议   香港-观塘区   \n",
       "1         ['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']      25-40k   香港-观塘区   \n",
       "2                                                   []      40-60k   香港-观塘区   \n",
       "3                                     ['交易产品', '金融行业']        薪资面议   香港-中西区   \n",
       "4                                                   []        薪资面议    香港-东区   \n",
       "..                                                 ...         ...      ...   \n",
       "104                                                 []  40-70k·18薪       香港   \n",
       "105                                             ['本科']      12-25k   香港-湾仔区   \n",
       "106                             ['本科', '功能测试', '软件测试']      20-25k       香港   \n",
       "107   ['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']      20-25k    香港-东区   \n",
       "108                                             ['本科']      20-21k  香港-油尖旺区   \n",
       "\n",
       "    job.requireWorkYears  job.refreshTime  job.jobId  job.jobKind  ...  \\\n",
       "0                   3-5年   20221118143443   51880109            2  ...   \n",
       "1                  5-10年   20230602174402   58720383            2  ...   \n",
       "2                   3-5年   20230602174402   58720027            2  ...   \n",
       "3                  5-10年   20221230112638   55273999            2  ...   \n",
       "4                  10年以上   20220810153828   51789749            2  ...   \n",
       "..                   ...              ...        ...          ...  ...   \n",
       "104                5-10年   20230522113042   46316869            1  ...   \n",
       "105                  NaN   20210223134718   36105889            6  ...   \n",
       "106                  NaN   20230613110233   59283885            6  ...   \n",
       "107                  NaN   20230506100220   58318215            6  ...   \n",
       "108                  NaN   20230614100413   57158615            6  ...   \n",
       "\n",
       "       recruiter.recruiterTitle         recruiter.recruiterPhoto comp.compId  \\\n",
       "0                     人力资源经理/主管  5f8f9866dfb13a7dee342f1808u.jpg   8226823.0   \n",
       "1    Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png  13057723.0   \n",
       "2    Talent Acquisition Manager  61e1521019ffac3de11dd5c403u.png  13057723.0   \n",
       "3                           NaN  5f8f9865ea60860b75384fa508u.jpg   4580900.0   \n",
       "4                       Sourcer  5f8f9865ea60860b75384fa508u.jpg   1069385.0   \n",
       "..                          ...                              ...         ...   \n",
       "104                        猎头顾问  5a95fa858e50c5b3522c209306a.png         NaN   \n",
       "105                         NaN  5f8f9866dfb13a7dee342f1808u.jpg  12208295.0   \n",
       "106                          HR  63a26c44dab8425fae0e7e1b03u.png   9861675.0   \n",
       "107                         NaN  5f8f986779c7cc70efbf36c008u.jpg  13447701.0   \n",
       "108            senior recruiter  5f8f98648dbe6273dcf8515508u.jpg   2680101.0   \n",
       "\n",
       "    comp.compScale                  comp.compName  comp.compStage  \\\n",
       "0       2000-5000人                          金融壹账通            美股上市   \n",
       "1           50-99人  KPay merchant service limited             NaN   \n",
       "2           50-99人  KPay merchant service limited             NaN   \n",
       "3      5000-10000人                   中国国际金融股份有限公司          沪深A股上市   \n",
       "4         10000人以上                           伊顿中国             NaN   \n",
       "..             ...                            ...             ...   \n",
       "104       500-999人                     某公募基金理财子公司           融资未公开   \n",
       "105     2000-5000人                     华润数科控股有限公司             NaN   \n",
       "106       100-499人                   成都无敌勇士科技有限公司           融资未公开   \n",
       "107            NaN                  Winner Studio             NaN   \n",
       "108       100-499人                           阿特金斯             NaN   \n",
       "\n",
       "                       comp.compLogo  \\\n",
       "0    5f3ca396ea60860b75020faa02u.jpg   \n",
       "1    61b07937d0458d53c627567e02u.jpg   \n",
       "2    61b07937d0458d53c627567e02u.jpg   \n",
       "3    5bcd8a2f8e50a3257f7102c304a.jpg   \n",
       "4    5bfe9df574719d2aa34b7b2203a.png   \n",
       "..                               ...   \n",
       "104  60e2fe0bf3df194a3c48adb502u.png   \n",
       "105  616f846645a2627dc008eaa008u.png   \n",
       "106  62b3ce0c8cd3bf59a05ff51d04u.png   \n",
       "107  61b07937d0458d53c627567e02u.jpg   \n",
       "108  5cd93b94501544662c710a6c05u.png   \n",
       "\n",
       "                                    comp.link  comp.compIndustry  \\\n",
       "0     https://www.liepin.com/company/8226823/               科技金融   \n",
       "1    https://www.liepin.com/company/13057723/               科技金融   \n",
       "2    https://www.liepin.com/company/13057723/               科技金融   \n",
       "3     https://www.liepin.com/company/4580900/           基金/证券/期货   \n",
       "4     https://www.liepin.com/company/1069385/              机械/设备   \n",
       "..                                        ...                ...   \n",
       "104                                       NaN           基金/证券/投资   \n",
       "105  https://www.liepin.com/company/12208295/               人工智能   \n",
       "106   https://www.liepin.com/company/9861675/                 游戏   \n",
       "107  https://www.liepin.com/company/13447701/                 游戏   \n",
       "108   https://www.liepin.com/company/2680101/            房地产开发经营   \n",
       "\n",
       "    job.campusJobKind  \n",
       "0                 NaN  \n",
       "1                 NaN  \n",
       "2                 NaN  \n",
       "3                 NaN  \n",
       "4                 NaN  \n",
       "..                ...  \n",
       "104               NaN  \n",
       "105                应届  \n",
       "106                应届  \n",
       "107                应届  \n",
       "108                应届  \n",
       "\n",
       "[109 rows x 33 columns]"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the workbook whose file name is built from `key` and `output_time`.\r\n",
    "df = pd.read_excel(f'{key}_liepin_{output_time}.xlsx')\r\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:57:44.685760Z",
     "iopub.status.busy": "2023-06-14T09:57:44.684924Z",
     "iopub.status.idle": "2023-06-14T09:57:44.698831Z",
     "shell.execute_reply": "2023-06-14T09:57:44.697756Z",
     "shell.execute_reply.started": "2023-06-14T09:57:44.685721Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\r\n",
      "RangeIndex: 109 entries, 0 to 108\r\n",
      "Data columns (total 33 columns):\r\n",
      " #   Column                    Non-Null Count  Dtype  \r\n",
      "---  ------                    --------------  -----  \r\n",
      " 0   Unnamed: 0                109 non-null    int64  \r\n",
      " 1   dataInfo                  109 non-null    object \r\n",
      " 2   dataParams                109 non-null    object \r\n",
      " 3   job.labels                109 non-null    object \r\n",
      " 4   job.salary                109 non-null    object \r\n",
      " 5   job.dq                    109 non-null    object \r\n",
      " 6   job.requireWorkYears      105 non-null    object \r\n",
      " 7   job.refreshTime           109 non-null    int64  \r\n",
      " 8   job.jobId                 109 non-null    int64  \r\n",
      " 9   job.jobKind               109 non-null    int64  \r\n",
      " 10  job.topJob                109 non-null    bool   \r\n",
      " 11  job.advViewFlag           109 non-null    bool   \r\n",
      " 12  job.title                 109 non-null    object \r\n",
      " 13  job.link                  109 non-null    object \r\n",
      " 14  job.dataPromId            109 non-null    object \r\n",
      " 15  job.pcOuterLink           0 non-null      float64\r\n",
      " 16  job.h5OuterLink           0 non-null      float64\r\n",
      " 17  job.requireEduLevel       105 non-null    object \r\n",
      " 18  recruiter.chatted         109 non-null    bool   \r\n",
      " 19  recruiter.imId            109 non-null    object \r\n",
      " 20  recruiter.imUserType      109 non-null    int64  \r\n",
      " 21  recruiter.recruiterId     109 non-null    object \r\n",
      " 22  recruiter.recruiterName   109 non-null    object \r\n",
      " 23  recruiter.recruiterTitle  88 non-null     object \r\n",
      " 24  recruiter.recruiterPhoto  109 non-null    object \r\n",
      " 25  comp.compId               77 non-null     float64\r\n",
      " 26  comp.compScale            100 non-null    object \r\n",
      " 27  comp.compName             109 non-null    object \r\n",
      " 28  comp.compStage            47 non-null     object \r\n",
      " 29  comp.compLogo             109 non-null    object \r\n",
      " 30  comp.link                 77 non-null     object \r\n",
      " 31  comp.compIndustry         109 non-null    object \r\n",
      " 32  job.campusJobKind         4 non-null      object \r\n",
      "dtypes: bool(3), float64(3), int64(5), object(22)\r\n",
      "memory usage: 26.0+ KB\r\n"
     ]
    }
   ],
   "source": [
    "# Summarise df: column names, non-null counts and dtypes.\n",
    "df.info()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 筛选存在数据分析价值的列"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:57:46.948046Z",
     "iopub.status.busy": "2023-06-14T09:57:46.947110Z",
     "iopub.status.idle": "2023-06-14T09:57:46.970901Z",
     "shell.execute_reply": "2023-06-14T09:57:46.970117Z",
     "shell.execute_reply.started": "2023-06-14T09:57:46.948006Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>job.title</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.requireEduLevel</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>comp.compScale</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...</td>\n",
       "      <td>20221118143443</td>\n",
       "      <td>产品经理 Product Manager</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>美股上市</td>\n",
       "      <td>金融壹账通</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品经理 (Senior) Product Manager</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品市场经理 Product Marketing Manager</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>['交易产品', '金融行业']</td>\n",
       "      <td>20221230112638</td>\n",
       "      <td>产品经理-海外交易柜台方向</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>中国国际金融股份有限公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>5000-10000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>[]</td>\n",
       "      <td>20220810153828</td>\n",
       "      <td>Product Manager-Film Capacitor/Polymer Capacitor</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>伊顿中国</td>\n",
       "      <td>机械/设备</td>\n",
       "      <td>10000人以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>104</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>风险合规经理（离岸财富管理产品）</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>500-999人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106</th>\n",
       "      <td>['本科', '功能测试', '软件测试']</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>软件测试应届生（23届）</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>游戏</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>107</th>\n",
       "      <td>['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>APP测试工程师</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>游戏</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>Graduate Engineer (Civil and MEP Engineering)</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>109 rows × 12 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                            job.labels  job.refreshTime  \\\n",
       "0    ['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...   20221118143443   \n",
       "1         ['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']   20230602174402   \n",
       "2                                                   []   20230602174402   \n",
       "3                                     ['交易产品', '金融行业']   20221230112638   \n",
       "4                                                   []   20220810153828   \n",
       "..                                                 ...              ...   \n",
       "104                                                 []   20230522113042   \n",
       "105                                             ['本科']   20210223134718   \n",
       "106                             ['本科', '功能测试', '软件测试']   20230613110233   \n",
       "107   ['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']   20230506100220   \n",
       "108                                             ['本科']   20230614100413   \n",
       "\n",
       "                                            job.title  job.salary   job.dq  \\\n",
       "0                                产品经理 Product Manager        薪资面议   香港-观塘区   \n",
       "1                       产品经理 (Senior) Product Manager      25-40k   香港-观塘区   \n",
       "2                    产品市场经理 Product Marketing Manager      40-60k   香港-观塘区   \n",
       "3                                       产品经理-海外交易柜台方向        薪资面议   香港-中西区   \n",
       "4    Product Manager-Film Capacitor/Polymer Capacitor        薪资面议    香港-东区   \n",
       "..                                                ...         ...      ...   \n",
       "104                                  风险合规经理（离岸财富管理产品）  40-70k·18薪       香港   \n",
       "105                                              产品经理      12-25k   香港-湾仔区   \n",
       "106                                      软件测试应届生（23届）      20-25k       香港   \n",
       "107                                          APP测试工程师      20-25k    香港-东区   \n",
       "108     Graduate Engineer (Civil and MEP Engineering)      20-21k  香港-油尖旺区   \n",
       "\n",
       "     job.topJob job.requireWorkYears job.requireEduLevel comp.compStage  \\\n",
       "0         False                 3-5年                统招本科           美股上市   \n",
       "1         False                5-10年                  本科            NaN   \n",
       "2         False                 3-5年                  本科            NaN   \n",
       "3         False                5-10年                  硕士         沪深A股上市   \n",
       "4         False                10年以上                统招本科            NaN   \n",
       "..          ...                  ...                 ...            ...   \n",
       "104       False                5-10年               硕士及以上          融资未公开   \n",
       "105       False                  NaN                 NaN            NaN   \n",
       "106       False                  NaN                 NaN          融资未公开   \n",
       "107       False                  NaN                 NaN            NaN   \n",
       "108       False                  NaN                 NaN            NaN   \n",
       "\n",
       "                     comp.compName comp.compIndustry comp.compScale  \n",
       "0                            金融壹账通              科技金融     2000-5000人  \n",
       "1    KPay merchant service limited              科技金融         50-99人  \n",
       "2    KPay merchant service limited              科技金融         50-99人  \n",
       "3                     中国国际金融股份有限公司          基金/证券/期货    5000-10000人  \n",
       "4                             伊顿中国             机械/设备       10000人以上  \n",
       "..                             ...               ...            ...  \n",
       "104                     某公募基金理财子公司          基金/证券/投资       500-999人  \n",
       "105                     华润数科控股有限公司              人工智能     2000-5000人  \n",
       "106                   成都无敌勇士科技有限公司                游戏       100-499人  \n",
       "107                  Winner Studio                游戏            NaN  \n",
       "108                           阿特金斯           房地产开发经营       100-499人  \n",
       "\n",
       "[109 rows x 12 columns]"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Keep only the twelve job/company columns used by the analysis cells below.\n",
    "df_PM_gz = df[[\n",
    "    'job.labels', 'job.refreshTime', 'job.title', 'job.salary',\n",
    "    'job.dq', 'job.topJob', 'job.requireWorkYears', 'job.requireEduLevel',\n",
    "    'comp.compStage', 'comp.compName', 'comp.compIndustry', 'comp.compScale',\n",
    "]]\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 广州的PM地区分布"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:57:49.523595Z",
     "iopub.status.busy": "2023-06-14T09:57:49.522965Z",
     "iopub.status.idle": "2023-06-14T09:57:49.532353Z",
     "shell.execute_reply": "2023-06-14T09:57:49.531510Z",
     "shell.execute_reply.started": "2023-06-14T09:57:49.523563Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "香港         41\n",
       "香港-葵青区     17\n",
       "香港-湾仔区     15\n",
       "香港-中西区     12\n",
       "香港-观塘区      6\n",
       "香港-东区       5\n",
       "香港-油尖旺区     3\n",
       "香港-沙田区      3\n",
       "香港-元朗区      2\n",
       "香港-西贡区      2\n",
       "香港-荃湾区      1\n",
       "香港-深水埗区     1\n",
       "香港-九龙城区     1\n",
       "Name: job.dq, dtype: int64"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Number of postings per `job.dq` label, most frequent first.\n",
    "df_PM_gz['job.dq'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:00:35.051639Z",
     "iopub.status.busy": "2023-06-14T10:00:35.051127Z",
     "iopub.status.idle": "2023-06-14T10:00:35.058315Z",
     "shell.execute_reply": "2023-06-14T10:00:35.057495Z",
     "shell.execute_reply.started": "2023-06-14T10:00:35.051607Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['香港',\n",
       " '香港-葵青区',\n",
       " '香港-湾仔区',\n",
       " '香港-中西区',\n",
       " '香港-观塘区',\n",
       " '香港-东区',\n",
       " '香港-油尖旺区',\n",
       " '香港-沙田区',\n",
       " '香港-元朗区',\n",
       " '香港-西贡区',\n",
       " '香港-荃湾区',\n",
       " '香港-深水埗区',\n",
       " '香港-九龙城区']"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# The distinct `job.dq` labels as a plain list, in value_counts() order.\n",
    "df_PM_gz['job.dq'].value_counts().index.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T09:57:51.733591Z",
     "iopub.status.busy": "2023-06-14T09:57:51.732592Z",
     "iopub.status.idle": "2023-06-14T09:57:51.740734Z",
     "shell.execute_reply": "2023-06-14T09:57:51.740007Z",
     "shell.execute_reply.started": "2023-06-14T09:57:51.733551Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['葵青区',\n",
       " '湾仔区',\n",
       " '中西区',\n",
       " '观塘区',\n",
       " '东区',\n",
       " '油尖旺区',\n",
       " '沙田区',\n",
       " '元朗区',\n",
       " '西贡区',\n",
       " '荃湾区',\n",
       " '深水埗区',\n",
       " '九龙城区']"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# District part (text after '-') of every `job.dq` label except the first one.\n",
    "# NOTE(review): the [1:] slice assumes the most frequent label is the bare city\n",
    "# name without '-'; any remaining label lacking '-' raises IndexError here.\n",
    "# The counts cell uses the same [1:] offset, so change both together.\n",
    "广州地区 = [\n",
    "    label.split('-')[1]\n",
    "    for label in df_PM_gz['job.dq'].value_counts().index[1:]\n",
    "]\n",
    "广州地区"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:46:43.654049Z",
     "iopub.status.busy": "2023-05-31T12:46:43.653458Z",
     "iopub.status.idle": "2023-05-31T12:46:43.660976Z",
     "shell.execute_reply": "2023-05-31T12:46:43.660262Z",
     "shell.execute_reply.started": "2023-05-31T12:46:43.654007Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[8, 6, 4, 3, 1, 1, 1, 1]"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Posting counts for every `job.dq` label except the first (most frequent) one.\n",
    "# NOTE(review): the [1:] offset must stay in step with the slice used to build\n",
    "# the district-name list, otherwise names and counts are paired incorrectly.\n",
    "广州_岗位个数 = df_PM_gz['job.dq'].value_counts().iloc[1:].tolist()\n",
    "广州_岗位个数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:46:48.119036Z",
     "iopub.status.busy": "2023-05-31T12:46:48.118708Z",
     "iopub.status.idle": "2023-05-31T12:46:48.302915Z",
     "shell.execute_reply": "2023-05-31T12:46:48.302055Z",
     "shell.execute_reply.started": "2023-05-31T12:46:48.119004Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "<script>\n",
       "    require.config({\n",
       "        paths: {\n",
       "            'echarts':'https://assets.pyecharts.org/assets/v5/echarts.min', '广州':'https://assets.pyecharts.org/assets/v5/maps/guang3_dong1_guang3_zhou1'\n",
       "        }\n",
       "    });\n",
       "</script>\n",
       "\n",
       "        <div id=\"187c624657614622859d063a8c9d4586\" style=\"width:900px; height:500px;\"></div>\n",
       "\n",
       "<script>\n",
       "        require(['echarts', '广州'], function(echarts) {\n",
       "                var chart_187c624657614622859d063a8c9d4586 = echarts.init(\n",
       "                    document.getElementById('187c624657614622859d063a8c9d4586'), 'white', {renderer: 'canvas'});\n",
       "                var option_187c624657614622859d063a8c9d4586 = {\n",
       "    \"animation\": true,\n",
       "    \"animationThreshold\": 2000,\n",
       "    \"animationDuration\": 1000,\n",
       "    \"animationEasing\": \"cubicOut\",\n",
       "    \"animationDelay\": 0,\n",
       "    \"animationDurationUpdate\": 300,\n",
       "    \"animationEasingUpdate\": \"cubicOut\",\n",
       "    \"animationDelayUpdate\": 0,\n",
       "    \"aria\": {\n",
       "        \"enabled\": false\n",
       "    },\n",
       "    \"color\": [\n",
       "        \"#5470c6\",\n",
       "        \"#91cc75\",\n",
       "        \"#fac858\",\n",
       "        \"#ee6666\",\n",
       "        \"#73c0de\",\n",
       "        \"#3ba272\",\n",
       "        \"#fc8452\",\n",
       "        \"#9a60b4\",\n",
       "        \"#ea7ccc\"\n",
       "    ],\n",
       "    \"series\": [\n",
       "        {\n",
       "            \"type\": \"map\",\n",
       "            \"name\": \"\\u5546\\u5bb6A\",\n",
       "            \"label\": {\n",
       "                \"show\": true,\n",
       "                \"margin\": 8\n",
       "            },\n",
       "            \"map\": \"\\u5e7f\\u5dde\",\n",
       "            \"data\": [\n",
       "                {\n",
       "                    \"name\": \"\\u6d77\\u73e0\\u533a\",\n",
       "                    \"value\": 8\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u5929\\u6cb3\\u533a\",\n",
       "                    \"value\": 6\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u756a\\u79ba\\u533a\",\n",
       "                    \"value\": 4\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u767d\\u4e91\\u533a\",\n",
       "                    \"value\": 3\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u8354\\u6e7e\\u533a\",\n",
       "                    \"value\": 1\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u8d8a\\u79c0\\u533a\",\n",
       "                    \"value\": 1\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u9ec4\\u57d4\\u533a\",\n",
       "                    \"value\": 1\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"\\u5357\\u6c99\\u533a\",\n",
       "                    \"value\": 1\n",
       "                }\n",
       "            ],\n",
       "            \"roam\": true,\n",
       "            \"aspectScale\": 0.75,\n",
       "            \"nameProperty\": \"name\",\n",
       "            \"selectedMode\": false,\n",
       "            \"zoom\": 1,\n",
       "            \"zlevel\": 0,\n",
       "            \"z\": 2,\n",
       "            \"seriesLayoutBy\": \"column\",\n",
       "            \"datasetIndex\": 0,\n",
       "            \"mapValueCalculation\": \"sum\",\n",
       "            \"showLegendSymbol\": true,\n",
       "            \"emphasis\": {}\n",
       "        }\n",
       "    ],\n",
       "    \"legend\": [\n",
       "        {\n",
       "            \"data\": [\n",
       "                \"\\u5546\\u5bb6A\"\n",
       "            ],\n",
       "            \"selected\": {},\n",
       "            \"show\": true,\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"itemWidth\": 25,\n",
       "            \"itemHeight\": 14,\n",
       "            \"backgroundColor\": \"transparent\",\n",
       "            \"borderColor\": \"#ccc\",\n",
       "            \"borderWidth\": 1,\n",
       "            \"borderRadius\": 0,\n",
       "            \"pageButtonItemGap\": 5,\n",
       "            \"pageButtonPosition\": \"end\",\n",
       "            \"pageFormatter\": \"{current}/{total}\",\n",
       "            \"pageIconColor\": \"#2f4554\",\n",
       "            \"pageIconInactiveColor\": \"#aaa\",\n",
       "            \"pageIconSize\": 15,\n",
       "            \"animationDurationUpdate\": 800,\n",
       "            \"selector\": false,\n",
       "            \"selectorPosition\": \"auto\",\n",
       "            \"selectorItemGap\": 7,\n",
       "            \"selectorButtonGap\": 10\n",
       "        }\n",
       "    ],\n",
       "    \"tooltip\": {\n",
       "        \"show\": true,\n",
       "        \"trigger\": \"item\",\n",
       "        \"triggerOn\": \"mousemove|click\",\n",
       "        \"axisPointer\": {\n",
       "            \"type\": \"line\"\n",
       "        },\n",
       "        \"showContent\": true,\n",
       "        \"alwaysShowContent\": false,\n",
       "        \"showDelay\": 0,\n",
       "        \"hideDelay\": 100,\n",
       "        \"enterable\": false,\n",
       "        \"confine\": false,\n",
       "        \"appendToBody\": false,\n",
       "        \"transitionDuration\": 0.4,\n",
       "        \"textStyle\": {\n",
       "            \"fontSize\": 14\n",
       "        },\n",
       "        \"borderWidth\": 0,\n",
       "        \"padding\": 5,\n",
       "        \"order\": \"seriesAsc\"\n",
       "    },\n",
       "    \"title\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"text\": \"Map-\\u5e7f\\u5dde\\u5730\\u56fe\",\n",
       "            \"target\": \"blank\",\n",
       "            \"subtarget\": \"blank\",\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"textAlign\": \"auto\",\n",
       "            \"textVerticalAlign\": \"auto\",\n",
       "            \"triggerEvent\": false\n",
       "        }\n",
       "    ],\n",
       "    \"visualMap\": {\n",
       "        \"show\": true,\n",
       "        \"type\": \"continuous\",\n",
       "        \"min\": 0,\n",
       "        \"max\": 100,\n",
       "        \"inRange\": {\n",
       "            \"color\": [\n",
       "                \"#50a3ba\",\n",
       "                \"#eac763\",\n",
       "                \"#d94e5d\"\n",
       "            ]\n",
       "        },\n",
       "        \"calculable\": true,\n",
       "        \"inverse\": false,\n",
       "        \"splitNumber\": 5,\n",
       "        \"hoverLink\": true,\n",
       "        \"orient\": \"vertical\",\n",
       "        \"padding\": 5,\n",
       "        \"showLabel\": true,\n",
       "        \"itemWidth\": 20,\n",
       "        \"itemHeight\": 140,\n",
       "        \"borderWidth\": 0\n",
       "    }\n",
       "};\n",
       "                chart_187c624657614622859d063a8c9d4586.setOption(option_187c624657614622859d063a8c9d4586);\n",
       "        });\n",
       "    </script>\n"
      ],
      "text/plain": [
       "<pyecharts.render.display.HTML at 0x7fa359569110>"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Visualisation: choropleth of posting counts per district.\n",
    "# Map.add is fed the data in the shape it expects: a list of [name, count] pairs.\n",
    "\n",
    "from pyecharts import options as opts\n",
    "from pyecharts.charts import Map\n",
    "from pyecharts.faker import Faker  # unused in this cell; kept in case later cells rely on it\n",
    "\n",
    "# NOTE(review): the map type is fixed to \"广州\"; district names from another city\n",
    "# will presumably not match any region on it -- confirm against the scraped city.\n",
    "c = (\n",
    "    Map()\n",
    "    .add(\"商家A\", [list(z) for z in zip(广州地区, 广州_岗位个数)], \"广州\")\n",
    "    .set_global_opts(\n",
    "        title_opts=opts.TitleOpts(title=\"Map-广州地图\"),\n",
    "        # Scale the colour ramp to the largest count. The default 0-100 range\n",
    "        # leaves small per-district counts almost indistinguishable.\n",
    "        # default=100 keeps the previous range when there is no data.\n",
    "        visualmap_opts=opts.VisualMapOpts(max_=max(广州_岗位个数, default=100)),\n",
    "    )\n",
    ")\n",
    "c.render_notebook()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 职位分布\n",
    "\n",
    "* 知识点：dataframe字符串处理\n",
    "> 1. [pandas.series.str](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.Series.str.html)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:01:46.809709Z",
     "iopub.status.busy": "2023-06-14T10:01:46.808973Z",
     "iopub.status.idle": "2023-06-14T10:01:46.816424Z",
     "shell.execute_reply": "2023-06-14T10:01:46.815741Z",
     "shell.execute_reply.started": "2023-06-14T10:01:46.809673Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0                                  产品经理 Product Manager\n",
       "1                         产品经理 (Senior) Product Manager\n",
       "2                      产品市场经理 Product Marketing Manager\n",
       "3                                         产品经理-海外交易柜台方向\n",
       "4      Product Manager-Film Capacitor/Polymer Capacitor\n",
       "                             ...                       \n",
       "104                                    风险合规经理（离岸财富管理产品）\n",
       "105                                                产品经理\n",
       "106                                        软件测试应届生（23届）\n",
       "107                                            APP测试工程师\n",
       "108       Graduate Engineer (Civil and MEP Engineering)\n",
       "Name: job.title, Length: 109, dtype: object"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Raw job titles, before any cleaning.\n",
    "df_PM_gz['job.title']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:02:34.364417Z",
     "iopub.status.busy": "2023-06-14T10:02:34.363335Z",
     "iopub.status.idle": "2023-06-14T10:02:34.374770Z",
     "shell.execute_reply": "2023-06-14T10:02:34.373875Z",
     "shell.execute_reply.started": "2023-06-14T10:02:34.364367Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "12             金融产品经理\n",
       "23                   \n",
       "27                   \n",
       "29             【总行岗位】\n",
       "49     HCM产品行销经理\\售前顾问\n",
       "69         平台产品leader\n",
       "76          石油化工项目工程师\n",
       "82                   \n",
       "86       石油化工项目-设计工程师\n",
       "93         高级ICT技术经理 \n",
       "101             9号牌RO\n",
       "102            证券投资经理\n",
       "104            风险合规经理\n",
       "106           软件测试应届生\n",
       "Name: job.title, dtype: object"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# TODO: the result still has to be merged back into the original rows.\n",
    "# Preview only: titles containing a full-width '（', cut off before that character.\n",
    "(\n",
    "    df_PM_gz.loc[df_PM_gz['job.title'].str.contains('（'), 'job.title']\n",
    "    .str.split('（')\n",
    "    .str[0]\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:03:03.648024Z",
     "iopub.status.busy": "2023-06-14T10:03:03.647202Z",
     "iopub.status.idle": "2023-06-14T10:03:03.657626Z",
     "shell.execute_reply": "2023-06-14T10:03:03.656850Z",
     "shell.execute_reply.started": "2023-06-14T10:03:03.647990Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "产品经理                                    11\n",
       "产品经理                                     6\n",
       "                                         3\n",
       "金融产品经理                                   2\n",
       "海外对冲基金产品专家                               2\n",
       "                                        ..\n",
       "软件测试应届生                                  1\n",
       "HCM产品行销经理\\售前顾问                           1\n",
       "新产品发展经理                                  1\n",
       "Product Manager , Electronic Banking     1\n",
       "SaaS Product Manager                     1\n",
       "Name: job.title, Length: 85, dtype: int64"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 处理过一些，清洗后的数据\n",
    "df_job_title = df_PM_gz['job.title'].apply(lambda x:x.split('（')[0].split('/')[0].split('(')[0]).value_counts()\n",
    "df_job_title"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:03:13.203843Z",
     "iopub.status.busy": "2023-06-14T10:03:13.202810Z",
     "iopub.status.idle": "2023-06-14T10:03:13.210359Z",
     "shell.execute_reply": "2023-06-14T10:03:13.209386Z",
     "shell.execute_reply.started": "2023-06-14T10:03:13.203803Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['产品经理',\n",
       " '产品经理 ',\n",
       " '',\n",
       " '金融产品经理',\n",
       " '海外对冲基金产品专家',\n",
       " 'Account Manager',\n",
       " 'Product Manager ',\n",
       " '数字化产品经理',\n",
       " '业务流程岗',\n",
       " '产品岗',\n",
       " 'IoT solution & Device Product Manager',\n",
       " 'Sales and Marketing Director',\n",
       " 'Senior Program Manager - HK',\n",
       " '商务开发经理',\n",
       " 'EHS技术产品研发经理 EHS Solutions RD Manager',\n",
       " 'Product Manager- Fulfillment',\n",
       " 'HelpDesk技术支持',\n",
       " '石油化工项目工程师',\n",
       " '产品经理-海外交易柜台方向',\n",
       " 'Assistant Manager, Digital Marketing',\n",
       " '9号牌RO',\n",
       " '风险合规经理',\n",
       " '产品市场经理 Product Marketing Manager',\n",
       " 'Product Marketing Manager_Timing Devices',\n",
       " 'Project Engineer - Project Management and Service Access',\n",
       " '[量化]基金经理',\n",
       " '基金产品经理',\n",
       " 'Product Manager-Film Capacitor',\n",
       " '蚂蚁集团-产品专家-国际事业群',\n",
       " '售前产品经理',\n",
       " '基金产品总监',\n",
       " 'Product Manager - Transaction',\n",
       " '38518H-【CRA】数据资产管理经理',\n",
       " '销售代表',\n",
       " 'Digital Marketing Manager',\n",
       " '产品解决方案专家',\n",
       " '数据中心运营流程管理高级工程师',\n",
       " '境外-创新增长运营-香港、北京',\n",
       " '财富产品专家',\n",
       " '证券投资经理',\n",
       " 'QA测试工程师',\n",
       " '投资经理',\n",
       " 'APP测试工程师',\n",
       " ' IT Project Manager',\n",
       " '客户服务经理Product & Customer Service Manager',\n",
       " 'Global CTA PM ',\n",
       " '香港高级投资经理',\n",
       " 'Business Management Product Manager',\n",
       " 'Quantitative Portfolio Manager 量化投资基金经理 - SG',\n",
       " '石油化工项目-设计工程师',\n",
       " '结构化产品专家',\n",
       " '产品设计工程师',\n",
       " '云计算售前产品经理',\n",
       " 'Graduate Engineer ',\n",
       " '数字营销经理',\n",
       " '仓库文员',\n",
       " '5G Device Product Manager',\n",
       " '数据产品经理',\n",
       " '【总行岗位】',\n",
       " '\\xa090M0116548项目工程师',\n",
       " 'Associate, Product Development',\n",
       " '仓库组长',\n",
       " '南方基金香港子公司',\n",
       " 'Project Engineer at HK Site',\n",
       " '对冲基金产品专家',\n",
       " '境外-创新增长运营',\n",
       " 'Healthcare Analyst',\n",
       " '高级ICT技术经理 ',\n",
       " '平台产品leader',\n",
       " '助理产品经理',\n",
       " '38518G-【CRA】产品经理',\n",
       " '海外交易柜台产品经理',\n",
       " '产品经理 Product Manager',\n",
       " '期权产品经理',\n",
       " 'Project Document Controller at HK Site',\n",
       " '38518C-【CRA】征信模型设计',\n",
       " '海外对冲基金产品总监',\n",
       " '南方东英-固收交易员',\n",
       " '数字化转型',\n",
       " 'Project Design Engineer at HK Site',\n",
       " '软件测试应届生',\n",
       " 'HCM产品行销经理\\\\售前顾问',\n",
       " '新产品发展经理',\n",
       " 'Product Manager , Electronic Banking',\n",
       " 'SaaS Product Manager']"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_job_title.index.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:03:38.440940Z",
     "iopub.status.busy": "2023-06-14T10:03:38.440419Z",
     "iopub.status.idle": "2023-06-14T10:03:38.446092Z",
     "shell.execute_reply": "2023-06-14T10:03:38.445351Z",
     "shell.execute_reply.started": "2023-06-14T10:03:38.440910Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "85"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(df_job_title.index.tolist())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:03:48.636244Z",
     "iopub.status.busy": "2023-06-14T10:03:48.635205Z",
     "iopub.status.idle": "2023-06-14T10:03:48.644355Z",
     "shell.execute_reply": "2023-06-14T10:03:48.643492Z",
     "shell.execute_reply.started": "2023-06-14T10:03:48.636194Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[11,\n",
       " 6,\n",
       " 3,\n",
       " 2,\n",
       " 2,\n",
       " 2,\n",
       " 2,\n",
       " 2,\n",
       " 2,\n",
       " 2,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1,\n",
       " 1]"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_job_title.values.tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:04:03.880889Z",
     "iopub.status.busy": "2023-06-14T10:04:03.879937Z",
     "iopub.status.idle": "2023-06-14T10:04:03.890896Z",
     "shell.execute_reply": "2023-06-14T10:04:03.889952Z",
     "shell.execute_reply.started": "2023-06-14T10:04:03.880841Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "产品经理                           10\n",
       "业务流程岗(J11204)                   2\n",
       "Account Manager                 2\n",
       "海外对冲基金产品专家                      2\n",
       "Product Manager (AD to Dir)     2\n",
       "                               ..\n",
       "境外-创新增长运营                       1\n",
       "5G Device Product Manager       1\n",
       "对冲基金产品专家                        1\n",
       "南方基金香港子公司(南方东英) 债券交易员           1\n",
       "38518C-【CRA】征信模型设计              1\n",
       "Name: job.title, Length: 95, dtype: int64"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 未处理字符串的数据（不太整洁和干净的数据）\r\n",
    "df_PM_gz['job.title'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:46:52.879020Z",
     "iopub.status.busy": "2023-05-31T12:46:52.878471Z",
     "iopub.status.idle": "2023-05-31T12:46:52.885801Z",
     "shell.execute_reply": "2023-05-31T12:46:52.885062Z",
     "shell.execute_reply.started": "2023-05-31T12:46:52.878989Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('高级产品经理', 3),\n",
       " ('文创产品经理', 2),\n",
       " ('可视化产品经理', 1),\n",
       " ('产品经理-肿瘤', 1),\n",
       " ('AI应用产品经理', 1),\n",
       " ('B端产品经理', 1),\n",
       " ('品质PM', 1),\n",
       " ('网约车供需调度产品经理', 1),\n",
       " ('穿戴甲产品经理', 1),\n",
       " ('云网产品经理', 1),\n",
       " ('软件产品经理', 1),\n",
       " ('医药产品经理', 1),\n",
       " ('ERP产品经理', 1),\n",
       " ('风控产品经理', 1),\n",
       " ('IOT产品经理', 1),\n",
       " ('数据产品经理', 1),\n",
       " ('商业化产品经理', 1),\n",
       " ('AI产品经理岗', 1),\n",
       " ('电商产品经理', 1),\n",
       " ('高级产品', 1),\n",
       " ('高级硬件产品经理', 1)]"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 列表推导式\n",
    "PM_title_words = [(df_job_title.index.tolist()[i],df_job_title.values.tolist()[i]) for i in range (1,len(df_job_title.index.tolist()))]\n",
    "PM_title_words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:46:58.511550Z",
     "iopub.status.busy": "2023-05-31T12:46:58.510877Z",
     "iopub.status.idle": "2023-05-31T12:46:58.523247Z",
     "shell.execute_reply": "2023-05-31T12:46:58.522422Z",
     "shell.execute_reply.started": "2023-05-31T12:46:58.511512Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [],
   "source": [
    "from pyecharts import options as opts\n",
    "from pyecharts.charts import WordCloud\n",
    "from pyecharts.globals import SymbolType\n",
    "\n",
    "\n",
    "c = (\n",
    "    WordCloud()\n",
    "    .add(\"\", PM_title_words, word_size_range=[20, 100], shape=SymbolType.DIAMOND)\n",
    "    .set_global_opts(title_opts=opts.TitleOpts(title=\"WordCloud-shape-diamond\"))\n",
    "    .render(\"title_wordcloud_diamond.html\")\n",
    ")\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# job.labels\n",
    "* 目标：统计labels 的数量并做词云图"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:00.568863Z",
     "iopub.status.busy": "2023-05-31T12:47:00.568213Z",
     "iopub.status.idle": "2023-05-31T12:47:00.575944Z",
     "shell.execute_reply": "2023-05-31T12:47:00.575222Z",
     "shell.execute_reply.started": "2023-05-31T12:47:00.568830Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0                                        ['中台产品', '爬虫']\n",
       "1     ['AI人工智能产品', '数据产品', '推荐产品', '策略产品', '工具产品', '...\n",
       "2     ['数据产品', '计算机软件', '企业服务', '产品设计', '竞品分析', '原型设...\n",
       "3                               ['新零售', '商品中心', '产品经理']\n",
       "4                                              ['数据产品']\n",
       "5     ['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', ...\n",
       "6                                                    []\n",
       "7                                                    []\n",
       "8     ['财务产品', '数据产品', '交易产品', '电子商务', '产品规划', '产品设计...\n",
       "9     ['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', ...\n",
       "10                                                   []\n",
       "11    ['产品经理', '积木', '玩具', '潮玩', '产品企划', '市场分析', '产品...\n",
       "12    ['ERP产品', '工具产品', 'ERP系统', 'IT互联网', '贸易/进出口', ...\n",
       "13    ['广告产品', '商业产品', '策略产品', '广告行业', '广告营销', '旅游行业...\n",
       "14    ['产品规划', '电商产品', '供应链产品', 'CRM产品', 'ERP产品', '电...\n",
       "15                                                   []\n",
       "16    ['数据产品', '平台产品', '工具产品', '人工智能', '产品设计', 'Axur...\n",
       "17    ['硬件产品', '商业产品', '策略产品', '硬件系统集成', '用户研究', '竞品...\n",
       "18                    ['AI产品', '机器学习', '业务化建模', '数据标注']\n",
       "19               ['原型设计', '需求分析', '物联网', 'IOT', 'AIOT']\n",
       "20                                                   []\n",
       "21    ['需求分析', '产品经理', 'CRM产品', 'CRM系统', 'B端产品', '客户...\n",
       "22                                                   []\n",
       "23                                                   []\n",
       "24                                                   []\n",
       "25                                             ['产品策划']\n",
       "26                   ['供应链产品', 'ERP产品', '后台产品', 'to B']\n",
       "27                             ['策略产品', '产品规划', '市场调研']\n",
       "28                                                   []\n",
       "29    ['风控产品', '安全产品', '工具产品', '内容产品', '平台产品', '策略产品...\n",
       "30                 ['AI人工智能产品', '硬件产品', '智能硬件', '竞品分析']\n",
       "31    ['休闲食品', '新品上市', '市场调研', '渠道分析', '消费者研究', '活动策划']\n",
       "32                             ['用户研究', '产品规划', '数据分析']\n",
       "33    ['产品包装', '产品测试', '产品卖点', '渠道管理', '产品管理', '产品库存...\n",
       "34                   ['硬件产品', '智能硬件', '硬件系统集成', '教育行业']\n",
       "35    ['工具产品', '产品设计', '需求分析', '需求管理', '原型设计', '流程设计...\n",
       "36    ['产品设计', '架构设计', '供应链产品', '中台产品', '产品规划', '电子商...\n",
       "37                                                   []\n",
       "38                             ['工具产品', '团队管理', '产品规划']\n",
       "39    ['产品规划', '产品设计', '团队管理', '用户研究', 'Xmind', 'Vis...\n",
       "Name: job.labels, dtype: object"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['job.labels']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:01.890494Z",
     "iopub.status.busy": "2023-05-31T12:47:01.889832Z",
     "iopub.status.idle": "2023-05-31T12:47:01.897171Z",
     "shell.execute_reply": "2023-05-31T12:47:01.896385Z",
     "shell.execute_reply.started": "2023-05-31T12:47:01.890461Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([\"['中台产品', '爬虫']\",\n",
       "       \"['AI人工智能产品', '数据产品', '推荐产品', '策略产品', '工具产品', '人工智能', '团队管理', '产品规划']\",\n",
       "       \"['数据产品', '计算机软件', '企业服务', '产品设计', '竞品分析', '原型设计', '用户研究', '需求分析', '产品规划', '数据分析']\",\n",
       "       \"['新零售', '商品中心', '产品经理']\", \"['数据产品']\",\n",
       "       \"['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']\",\n",
       "       '[]', '[]',\n",
       "       \"['财务产品', '数据产品', '交易产品', '电子商务', '产品规划', '产品设计', '用户研究']\",\n",
       "       \"['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']\",\n",
       "       '[]', \"['产品经理', '积木', '玩具', '潮玩', '产品企划', '市场分析', '产品规划', '爆品']\",\n",
       "       \"['ERP产品', '工具产品', 'ERP系统', 'IT互联网', '贸易/进出口', '消费品', '产品设计', '产品优化', '产品规划', '需求分析']\",\n",
       "       \"['广告产品', '商业产品', '策略产品', '广告行业', '广告营销', '旅游行业', '产品设计', '产品规划', '产品优化', '数据分析']\",\n",
       "       \"['产品规划', '电商产品', '供应链产品', 'CRM产品', 'ERP产品', '电子商务', '家电行业', '消费品', '批发/零售', 'to C']\",\n",
       "       '[]',\n",
       "       \"['数据产品', '平台产品', '工具产品', '人工智能', '产品设计', 'Axure', '流程设计', 'Visio', '墨刀', '产品规划']\",\n",
       "       \"['硬件产品', '商业产品', '策略产品', '硬件系统集成', '用户研究', '竞品分析', '产品规划', '市场调研', '团队管理']\",\n",
       "       \"['AI产品', '机器学习', '业务化建模', '数据标注']\",\n",
       "       \"['原型设计', '需求分析', '物联网', 'IOT', 'AIOT']\", '[]',\n",
       "       \"['需求分析', '产品经理', 'CRM产品', 'CRM系统', 'B端产品', '客户关系管理系统', '经销渠道管理']\",\n",
       "       '[]', '[]', '[]', \"['产品策划']\", \"['供应链产品', 'ERP产品', '后台产品', 'to B']\",\n",
       "       \"['策略产品', '产品规划', '市场调研']\", '[]',\n",
       "       \"['风控产品', '安全产品', '工具产品', '内容产品', '平台产品', '策略产品', '电商产品', '电子商务', '安保行业', 'IT互联网']\",\n",
       "       \"['AI人工智能产品', '硬件产品', '智能硬件', '竞品分析']\",\n",
       "       \"['休闲食品', '新品上市', '市场调研', '渠道分析', '消费者研究', '活动策划']\",\n",
       "       \"['用户研究', '产品规划', '数据分析']\",\n",
       "       \"['产品包装', '产品测试', '产品卖点', '渠道管理', '产品管理', '产品库存', '竞品分析', '产品规划', '包装规划', '新品开发']\",\n",
       "       \"['硬件产品', '智能硬件', '硬件系统集成', '教育行业']\",\n",
       "       \"['工具产品', '产品设计', '需求分析', '需求管理', '原型设计', '流程设计', '需求确认', '团队管理']\",\n",
       "       \"['产品设计', '架构设计', '供应链产品', '中台产品', '产品规划', '电子商务', 'to B', '需求分析', '流程设计']\",\n",
       "       '[]', \"['工具产品', '团队管理', '产品规划']\",\n",
       "       \"['产品规划', '产品设计', '团队管理', '用户研究', 'Xmind', 'Visio', 'Axure']\"],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['job.labels'].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:02.790242Z",
     "iopub.status.busy": "2023-05-31T12:47:02.789572Z",
     "iopub.status.idle": "2023-05-31T12:47:02.797646Z",
     "shell.execute_reply": "2023-05-31T12:47:02.796785Z",
     "shell.execute_reply.started": "2023-05-31T12:47:02.790207Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([list(['中台产品', '爬虫']),\n",
       "       list(['AI人工智能产品', '数据产品', '推荐产品', '策略产品', '工具产品', '人工智能', '团队管理', '产品规划']),\n",
       "       list(['数据产品', '计算机软件', '企业服务', '产品设计', '竞品分析', '原型设计', '用户研究', '需求分析', '产品规划', '数据分析']),\n",
       "       list(['新零售', '商品中心', '产品经理']), list(['数据产品']),\n",
       "       list(['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']),\n",
       "       list([]), list([]),\n",
       "       list(['财务产品', '数据产品', '交易产品', '电子商务', '产品规划', '产品设计', '用户研究']),\n",
       "       list(['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']),\n",
       "       list([]),\n",
       "       list(['产品经理', '积木', '玩具', '潮玩', '产品企划', '市场分析', '产品规划', '爆品']),\n",
       "       list(['ERP产品', '工具产品', 'ERP系统', 'IT互联网', '贸易/进出口', '消费品', '产品设计', '产品优化', '产品规划', '需求分析']),\n",
       "       list(['广告产品', '商业产品', '策略产品', '广告行业', '广告营销', '旅游行业', '产品设计', '产品规划', '产品优化', '数据分析']),\n",
       "       list(['产品规划', '电商产品', '供应链产品', 'CRM产品', 'ERP产品', '电子商务', '家电行业', '消费品', '批发/零售', 'to C']),\n",
       "       list([]),\n",
       "       list(['数据产品', '平台产品', '工具产品', '人工智能', '产品设计', 'Axure', '流程设计', 'Visio', '墨刀', '产品规划']),\n",
       "       list(['硬件产品', '商业产品', '策略产品', '硬件系统集成', '用户研究', '竞品分析', '产品规划', '市场调研', '团队管理']),\n",
       "       list(['AI产品', '机器学习', '业务化建模', '数据标注']),\n",
       "       list(['原型设计', '需求分析', '物联网', 'IOT', 'AIOT']), list([]),\n",
       "       list(['需求分析', '产品经理', 'CRM产品', 'CRM系统', 'B端产品', '客户关系管理系统', '经销渠道管理']),\n",
       "       list([]), list([]), list([]), list(['产品策划']),\n",
       "       list(['供应链产品', 'ERP产品', '后台产品', 'to B']),\n",
       "       list(['策略产品', '产品规划', '市场调研']), list([]),\n",
       "       list(['风控产品', '安全产品', '工具产品', '内容产品', '平台产品', '策略产品', '电商产品', '电子商务', '安保行业', 'IT互联网']),\n",
       "       list(['AI人工智能产品', '硬件产品', '智能硬件', '竞品分析']),\n",
       "       list(['休闲食品', '新品上市', '市场调研', '渠道分析', '消费者研究', '活动策划']),\n",
       "       list(['用户研究', '产品规划', '数据分析']),\n",
       "       list(['产品包装', '产品测试', '产品卖点', '渠道管理', '产品管理', '产品库存', '竞品分析', '产品规划', '包装规划', '新品开发']),\n",
       "       list(['硬件产品', '智能硬件', '硬件系统集成', '教育行业']),\n",
       "       list(['工具产品', '产品设计', '需求分析', '需求管理', '原型设计', '流程设计', '需求确认', '团队管理']),\n",
       "       list(['产品设计', '架构设计', '供应链产品', '中台产品', '产品规划', '电子商务', 'to B', '需求分析', '流程设计']),\n",
       "       list([]), list(['工具产品', '团队管理', '产品规划']),\n",
       "       list(['产品规划', '产品设计', '团队管理', '用户研究', 'Xmind', 'Visio', 'Axure'])],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['job.labels'].apply(lambda x:eval(x)).values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:05.007435Z",
     "iopub.status.busy": "2023-05-31T12:47:05.006063Z",
     "iopub.status.idle": "2023-05-31T12:47:05.017735Z",
     "shell.execute_reply": "2023-05-31T12:47:05.016866Z",
     "shell.execute_reply.started": "2023-05-31T12:47:05.007386Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[['中台产品', '爬虫'],\n",
       " ['AI人工智能产品', '数据产品', '推荐产品', '策略产品', '工具产品', '人工智能', '团队管理', '产品规划'],\n",
       " ['数据产品',\n",
       "  '计算机软件',\n",
       "  '企业服务',\n",
       "  '产品设计',\n",
       "  '竞品分析',\n",
       "  '原型设计',\n",
       "  '用户研究',\n",
       "  '需求分析',\n",
       "  '产品规划',\n",
       "  '数据分析'],\n",
       " ['新零售', '商品中心', '产品经理'],\n",
       " ['数据产品'],\n",
       " ['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析'],\n",
       " [],\n",
       " [],\n",
       " ['财务产品', '数据产品', '交易产品', '电子商务', '产品规划', '产品设计', '用户研究'],\n",
       " ['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析'],\n",
       " [],\n",
       " ['产品经理', '积木', '玩具', '潮玩', '产品企划', '市场分析', '产品规划', '爆品'],\n",
       " ['ERP产品',\n",
       "  '工具产品',\n",
       "  'ERP系统',\n",
       "  'IT互联网',\n",
       "  '贸易/进出口',\n",
       "  '消费品',\n",
       "  '产品设计',\n",
       "  '产品优化',\n",
       "  '产品规划',\n",
       "  '需求分析'],\n",
       " ['广告产品',\n",
       "  '商业产品',\n",
       "  '策略产品',\n",
       "  '广告行业',\n",
       "  '广告营销',\n",
       "  '旅游行业',\n",
       "  '产品设计',\n",
       "  '产品规划',\n",
       "  '产品优化',\n",
       "  '数据分析'],\n",
       " ['产品规划',\n",
       "  '电商产品',\n",
       "  '供应链产品',\n",
       "  'CRM产品',\n",
       "  'ERP产品',\n",
       "  '电子商务',\n",
       "  '家电行业',\n",
       "  '消费品',\n",
       "  '批发/零售',\n",
       "  'to C'],\n",
       " [],\n",
       " ['数据产品',\n",
       "  '平台产品',\n",
       "  '工具产品',\n",
       "  '人工智能',\n",
       "  '产品设计',\n",
       "  'Axure',\n",
       "  '流程设计',\n",
       "  'Visio',\n",
       "  '墨刀',\n",
       "  '产品规划'],\n",
       " ['硬件产品', '商业产品', '策略产品', '硬件系统集成', '用户研究', '竞品分析', '产品规划', '市场调研', '团队管理'],\n",
       " ['AI产品', '机器学习', '业务化建模', '数据标注'],\n",
       " ['原型设计', '需求分析', '物联网', 'IOT', 'AIOT'],\n",
       " [],\n",
       " ['需求分析', '产品经理', 'CRM产品', 'CRM系统', 'B端产品', '客户关系管理系统', '经销渠道管理'],\n",
       " [],\n",
       " [],\n",
       " [],\n",
       " ['产品策划'],\n",
       " ['供应链产品', 'ERP产品', '后台产品', 'to B'],\n",
       " ['策略产品', '产品规划', '市场调研'],\n",
       " [],\n",
       " ['风控产品',\n",
       "  '安全产品',\n",
       "  '工具产品',\n",
       "  '内容产品',\n",
       "  '平台产品',\n",
       "  '策略产品',\n",
       "  '电商产品',\n",
       "  '电子商务',\n",
       "  '安保行业',\n",
       "  'IT互联网'],\n",
       " ['AI人工智能产品', '硬件产品', '智能硬件', '竞品分析'],\n",
       " ['休闲食品', '新品上市', '市场调研', '渠道分析', '消费者研究', '活动策划'],\n",
       " ['用户研究', '产品规划', '数据分析'],\n",
       " ['产品包装',\n",
       "  '产品测试',\n",
       "  '产品卖点',\n",
       "  '渠道管理',\n",
       "  '产品管理',\n",
       "  '产品库存',\n",
       "  '竞品分析',\n",
       "  '产品规划',\n",
       "  '包装规划',\n",
       "  '新品开发'],\n",
       " ['硬件产品', '智能硬件', '硬件系统集成', '教育行业'],\n",
       " ['工具产品', '产品设计', '需求分析', '需求管理', '原型设计', '流程设计', '需求确认', '团队管理'],\n",
       " ['产品设计', '架构设计', '供应链产品', '中台产品', '产品规划', '电子商务', 'to B', '需求分析', '流程设计'],\n",
       " [],\n",
       " ['工具产品', '团队管理', '产品规划'],\n",
       " ['产品规划', '产品设计', '团队管理', '用户研究', 'Xmind', 'Visio', 'Axure']]"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['job.labels'].apply(lambda x:eval(x)).tolist()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:06:43.283804Z",
     "iopub.status.busy": "2023-06-14T10:06:43.283252Z",
     "iopub.status.idle": "2023-06-14T10:06:43.295407Z",
     "shell.execute_reply": "2023-06-14T10:06:43.294467Z",
     "shell.execute_reply.started": "2023-06-14T10:06:43.283771Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['金融产品',\n",
       " '征信行业',\n",
       " '金融行业',\n",
       " '金融理财/贷款',\n",
       " '批发/零售',\n",
       " '产品优化',\n",
       " '产品设计',\n",
       " '用户研究',\n",
       " '交互设计',\n",
       " '团队管理',\n",
       " 'IT互联网',\n",
       " 'SaaS产品',\n",
       " 'to B',\n",
       " '产品设计',\n",
       " '移动端产品',\n",
       " '交易产品',\n",
       " '金融行业',\n",
       " '金融产品经理',\n",
       " '区块链',\n",
       " '产品规划',\n",
       " 'web3',\n",
       " '数据产品',\n",
       " 'to C',\n",
       " 'IT互联网',\n",
       " '征信行业',\n",
       " '金融产品',\n",
       " '征信行业',\n",
       " '金融行业',\n",
       " '金融理财/贷款',\n",
       " '批发/零售',\n",
       " '产品优化',\n",
       " '产品设计',\n",
       " '用户研究',\n",
       " '团队管理',\n",
       " '交互设计',\n",
       " '商业产品',\n",
       " '用户研究',\n",
       " '团队管理',\n",
       " '产品规划',\n",
       " '数据分析',\n",
       " '硬件产品',\n",
       " '游戏产品',\n",
       " '需求分析',\n",
       " 'IT互联网',\n",
       " '区块链',\n",
       " 'web端产品',\n",
       " '产品规划',\n",
       " '用户研究',\n",
       " '市场调研',\n",
       " '原型设计',\n",
       " '产品优化',\n",
       " 'Axure',\n",
       " 'CRM产品',\n",
       " '策略产品',\n",
       " '工具产品',\n",
       " '数据产品',\n",
       " 'to C',\n",
       " 'CRM系统',\n",
       " '广告营销',\n",
       " '用户研究',\n",
       " '产品设计',\n",
       " '产品规划',\n",
       " '量化交易',\n",
       " 'CTA策略',\n",
       " '投资产品',\n",
       " '工具产品',\n",
       " '电商产品',\n",
       " '通讯/网络设备',\n",
       " '广告营销',\n",
       " '电子商务',\n",
       " '产品优化',\n",
       " '数据产品',\n",
       " '征信行业',\n",
       " '产品优化',\n",
       " '产品设计',\n",
       " '产品规划',\n",
       " '智能家居',\n",
       " '物联网',\n",
       " '智慧家居',\n",
       " '智能硬件',\n",
       " '照明产品',\n",
       " '金融产品',\n",
       " '产品经理',\n",
       " '投资管理',\n",
       " '资产管理',\n",
       " '财富管理',\n",
       " 'Product Manager',\n",
       " '基金类',\n",
       " '商业产品',\n",
       " '云计算',\n",
       " '移动端产品',\n",
       " '用户研究',\n",
       " '竞品分析',\n",
       " '团队管理',\n",
       " '需求挖掘',\n",
       " '数据分析',\n",
       " '需求分析',\n",
       " '产品规划',\n",
       " '需求调研',\n",
       " '产品设计',\n",
       " '计算机软件',\n",
       " '通讯/网络设备',\n",
       " '后台产品',\n",
       " 'SaaS产品',\n",
       " 'CRM软件',\n",
       " '需求确认',\n",
       " '营销项目',\n",
       " 'CRM系统',\n",
       " '客户管理',\n",
       " 'RFP',\n",
       " '技术支持',\n",
       " '通信领域',\n",
       " 'saas',\n",
       " 'ActionScript',\n",
       " '新产品导入',\n",
       " 'EHS',\n",
       " 'PPE',\n",
       " '安全生产',\n",
       " '职业卫生',\n",
       " '工业卫生',\n",
       " 'HSE',\n",
       " 'ESH',\n",
       " 'Process safety',\n",
       " '工艺安全',\n",
       " '过程安全',\n",
       " 'HCM',\n",
       " '售前',\n",
       " '本地化',\n",
       " '海外',\n",
       " '基金产品总监',\n",
       " '基金筛选',\n",
       " 'FOF基金',\n",
       " '对冲基金',\n",
       " '结构化产品',\n",
       " '基金尽调',\n",
       " '海外基金',\n",
       " '市场营销',\n",
       " '竞品分析',\n",
       " '社交媒体',\n",
       " '社交媒介',\n",
       " '营销活动',\n",
       " '广告/传媒/文化',\n",
       " 'IT/互联网/软件',\n",
       " '施工现场管理',\n",
       " '建筑施工',\n",
       " 'PROJECT',\n",
       " '营销策划',\n",
       " '品牌策划',\n",
       " '自媒体策划',\n",
       " '社交媒体',\n",
       " '社交媒介',\n",
       " '营销活动',\n",
       " '广告/传媒/文化',\n",
       " 'IT/互联网/软件',\n",
       " '消费品',\n",
       " '施工现场管理',\n",
       " '安防工程',\n",
       " '建筑施工',\n",
       " 'ActionScript',\n",
       " '美元VC',\n",
       " '清华姚班',\n",
       " '清华智班',\n",
       " '清华量信班',\n",
       " '机器人',\n",
       " '人工智能研究院',\n",
       " 'AI',\n",
       " 'OpenAI',\n",
       " '用户运营',\n",
       " '包装设计',\n",
       " 'UG',\n",
       " 'SolidWorks',\n",
       " '结构设计',\n",
       " '3D设计',\n",
       " 'keyshot',\n",
       " '数据产品',\n",
       " '工具产品',\n",
       " '平台产品',\n",
       " '数据分析',\n",
       " '团队管理',\n",
       " '平台产品',\n",
       " '增长产品',\n",
       " 'IT互联网',\n",
       " '产品设计',\n",
       " '用户研究',\n",
       " '团队管理',\n",
       " '对冲基金',\n",
       " '医疗行业分析师',\n",
       " '用户运营',\n",
       " '产品运营',\n",
       " '质量管理',\n",
       " '风控项目',\n",
       " '.NET',\n",
       " 'ASP.NET',\n",
       " 'ClickHouse',\n",
       " '量化私募',\n",
       " '门店销售',\n",
       " '大数据',\n",
       " '流程管理',\n",
       " '交付管理',\n",
       " '流程优化',\n",
       " '化工行业',\n",
       " 'IT/互联网/软件',\n",
       " 'PMP',\n",
       " 'PMP项目管理认证',\n",
       " '项目管理师',\n",
       " '项目工程师',\n",
       " '香港工作',\n",
       " '土木工程',\n",
       " '结构工程',\n",
       " '金融产品',\n",
       " '金融行业',\n",
       " '征信行业',\n",
       " '用户研究',\n",
       " '产品规划',\n",
       " '数据产品',\n",
       " '数据挖掘',\n",
       " '质量管理',\n",
       " '风控项目',\n",
       " 'ASP.NET',\n",
       " '.NET',\n",
       " '项目施工管理',\n",
       " '金融产品',\n",
       " '互联网金融',\n",
       " '金融理财/贷款',\n",
       " '金融行业',\n",
       " 'IT互联网',\n",
       " '批发/零售',\n",
       " '产品设计',\n",
       " '产品规划',\n",
       " '团队管理',\n",
       " '出入库管理',\n",
       " '仓库管理',\n",
       " '订单管理',\n",
       " '库存管理',\n",
       " '库存盘点',\n",
       " '现场管理',\n",
       " '海外仓',\n",
       " '贸易/进出口',\n",
       " '电子产品及配件',\n",
       " '消费品',\n",
       " 'saas',\n",
       " '市场洞察',\n",
       " '客户管理',\n",
       " 'IT/互联网/软件',\n",
       " '电子/通信/硬件',\n",
       " '团队管理',\n",
       " '电子商务',\n",
       " '销售管理',\n",
       " '广告/传媒/文化',\n",
       " '学术/科研',\n",
       " '网络营销',\n",
       " '策划',\n",
       " '市场营销',\n",
       " 'office',\n",
       " '整合营销',\n",
       " '数据统计分析',\n",
       " '海外仓',\n",
       " '出入库管理',\n",
       " '库存盘点',\n",
       " '仓库管理',\n",
       " '库存管理',\n",
       " '现场管理',\n",
       " '消费品',\n",
       " '贸易/进出口',\n",
       " '交通/运输',\n",
       " '软件测试',\n",
       " 'selenium',\n",
       " 'appium',\n",
       " 'automation',\n",
       " '自动化',\n",
       " '自动化测试',\n",
       " 'SQL',\n",
       " '客户服务',\n",
       " '本科',\n",
       " '本科',\n",
       " '功能测试',\n",
       " '软件测试',\n",
       " '本科',\n",
       " '软件测试',\n",
       " '应用测试',\n",
       " '功能测试',\n",
       " 'iOS',\n",
       " 'Android',\n",
       " '本科']"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 列表的推导式\n",
    "PM_labels_list = [j for i in df_PM_gz['job.labels'].apply(lambda x:eval(x)).tolist() for j in i]\n",
    "PM_labels_list"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:06:44.897131Z",
     "iopub.status.busy": "2023-06-14T10:06:44.896602Z",
     "iopub.status.idle": "2023-06-14T10:06:44.909125Z",
     "shell.execute_reply": "2023-06-14T10:06:44.908412Z",
     "shell.execute_reply.started": "2023-06-14T10:06:44.897097Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('ASP.NET', 2),\n",
       " ('社交媒体', 2),\n",
       " ('建筑施工', 2),\n",
       " ('香港工作', 1),\n",
       " ('施工现场管理', 2),\n",
       " ('数据产品', 5),\n",
       " ('安防工程', 1),\n",
       " ('Axure', 1),\n",
       " ('机器人', 1),\n",
       " ('社交媒介', 2),\n",
       " ('财富管理', 1),\n",
       " ('HSE', 1),\n",
       " ('广告/传媒/文化', 3),\n",
       " ('海外仓', 2),\n",
       " ('售前', 1),\n",
       " ('订单管理', 1),\n",
       " ('移动端产品', 2),\n",
       " ('过程安全', 1),\n",
       " ('平台产品', 2),\n",
       " ('电商产品', 1),\n",
       " ('销售管理', 1),\n",
       " ('清华姚班', 1),\n",
       " ('竞品分析', 2),\n",
       " ('计算机软件', 1),\n",
       " ('电子商务', 2),\n",
       " ('工艺安全', 1),\n",
       " ('基金尽调', 1),\n",
       " ('基金类', 1),\n",
       " ('质量管理', 2),\n",
       " ('对冲基金', 2),\n",
       " ('CTA策略', 1),\n",
       " ('量化交易', 1),\n",
       " ('风控项目', 2),\n",
       " ('需求确认', 1),\n",
       " ('仓库管理', 2),\n",
       " ('团队管理', 8),\n",
       " ('3D设计', 1),\n",
       " ('整合营销', 1),\n",
       " ('云计算', 1),\n",
       " ('医疗行业分析师', 1),\n",
       " ('IT互联网', 5),\n",
       " ('物联网', 1),\n",
       " ('UG', 1),\n",
       " ('产品运营', 1),\n",
       " ('投资产品', 1),\n",
       " ('策略产品', 1),\n",
       " ('PMP项目管理认证', 1),\n",
       " ('selenium', 1),\n",
       " ('数据统计分析', 1),\n",
       " ('品牌策划', 1),\n",
       " ('PROJECT', 1),\n",
       " ('工业卫生', 1),\n",
       " ('用户研究', 8),\n",
       " ('资产管理', 1),\n",
       " ('游戏产品', 1),\n",
       " ('ActionScript', 2),\n",
       " ('电子产品及配件', 1),\n",
       " ('PMP', 1),\n",
       " ('web端产品', 1),\n",
       " ('通信领域', 1),\n",
       " ('流程管理', 1),\n",
       " ('appium', 1),\n",
       " ('automation', 1),\n",
       " ('CRM产品', 1),\n",
       " ('PPE', 1),\n",
       " ('消费品', 3),\n",
       " ('新产品导入', 1),\n",
       " ('量化私募', 1),\n",
       " ('网络营销', 1),\n",
       " ('产品经理', 1),\n",
       " ('化工行业', 1),\n",
       " ('交易产品', 1),\n",
       " ('区块链', 2),\n",
       " ('包装设计', 1),\n",
       " ('结构化产品', 1),\n",
       " ('大数据', 1),\n",
       " ('Android', 1),\n",
       " ('库存盘点', 2),\n",
       " ('商业产品', 2),\n",
       " ('功能测试', 2),\n",
       " ('项目管理师', 1),\n",
       " ('征信行业', 5),\n",
       " ('数据挖掘', 1),\n",
       " ('市场营销', 2),\n",
       " ('office', 1),\n",
       " ('技术支持', 1),\n",
       " ('SQL', 1),\n",
       " ('海外', 1),\n",
       " ('硬件产品', 1),\n",
       " ('安全生产', 1),\n",
       " ('saas', 2),\n",
       " ('现场管理', 2),\n",
       " ('职业卫生', 1),\n",
       " ('海外基金', 1),\n",
       " ('交通/运输', 1),\n",
       " ('产品优化', 5),\n",
       " ('keyshot', 1),\n",
       " ('SaaS产品', 2),\n",
       " ('美元VC', 1),\n",
       " ('客户管理', 2),\n",
       " ('结构工程', 1),\n",
       " ('用户运营', 2),\n",
       " ('AI', 1),\n",
       " ('软件测试', 3),\n",
       " ('自动化', 1),\n",
       " ('库存管理', 2),\n",
       " ('CRM系统', 2),\n",
       " ('学术/科研', 1),\n",
       " ('金融产品经理', 1),\n",
       " ('客户服务', 1),\n",
       " ('to C', 2),\n",
       " ('需求挖掘', 1),\n",
       " ('清华智班', 1),\n",
       " ('web3', 1),\n",
       " ('IT/互联网/软件', 4),\n",
       " ('FOF基金', 1),\n",
       " ('交互设计', 2),\n",
       " ('批发/零售', 3),\n",
       " ('EHS', 1),\n",
       " ('金融理财/贷款', 3),\n",
       " ('智慧家居', 1),\n",
       " ('后台产品', 1),\n",
       " ('原型设计', 1),\n",
       " ('本地化', 1),\n",
       " ('ClickHouse', 1),\n",
       " ('贸易/进出口', 2),\n",
       " ('金融产品', 5),\n",
       " ('智能硬件', 1),\n",
       " ('基金产品总监', 1),\n",
       " ('投资管理', 1),\n",
       " ('需求调研', 1),\n",
       " ('产品规划', 8),\n",
       " ('照明产品', 1),\n",
       " ('人工智能研究院', 1),\n",
       " ('互联网金融', 1),\n",
       " ('增长产品', 1),\n",
       " ('市场调研', 1),\n",
       " ('RFP', 1),\n",
       " ('应用测试', 1),\n",
       " ('自动化测试', 1),\n",
       " ('策划', 1),\n",
       " ('土木工程', 1),\n",
       " ('广告营销', 2),\n",
       " ('iOS', 1),\n",
       " ('to B', 1),\n",
       " ('ESH', 1),\n",
       " ('.NET', 2),\n",
       " ('电子/通信/硬件', 1),\n",
       " ('工具产品', 3),\n",
       " ('出入库管理', 2),\n",
       " ('产品设计', 8),\n",
       " ('本科', 4),\n",
       " ('基金筛选', 1),\n",
       " ('CRM软件', 1),\n",
       " ('金融行业', 5),\n",
       " ('交付管理', 1),\n",
       " ('HCM', 1),\n",
       " ('门店销售', 1),\n",
       " ('数据分析', 3),\n",
       " ('智能家居', 1),\n",
       " ('营销活动', 2),\n",
       " ('自媒体策划', 1),\n",
       " ('SolidWorks', 1),\n",
       " ('需求分析', 2),\n",
       " ('通讯/网络设备', 2),\n",
       " ('营销策划', 1),\n",
       " ('市场洞察', 1),\n",
       " ('流程优化', 1),\n",
       " ('营销项目', 1),\n",
       " ('Process safety', 1),\n",
       " ('OpenAI', 1),\n",
       " ('清华量信班', 1),\n",
       " ('项目工程师', 1),\n",
       " ('Product Manager', 1),\n",
       " ('结构设计', 1),\n",
       " ('项目施工管理', 1)]"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 创建words\n",
    "[(i,PM_labels_list.count(i)) for i in set(PM_labels_list)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:09.636514Z",
     "iopub.status.busy": "2023-05-31T12:47:09.635693Z",
     "iopub.status.idle": "2023-05-31T12:47:09.649754Z",
     "shell.execute_reply": "2023-05-31T12:47:09.648754Z",
     "shell.execute_reply.started": "2023-05-31T12:47:09.636465Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('渠道分析', 1),\n",
       " ('产品经理', 3),\n",
       " ('包装规划', 1),\n",
       " ('IOT', 1),\n",
       " ('产品库存', 1),\n",
       " ('物流快递', 2),\n",
       " ('O2O', 2),\n",
       " ('新零售', 1),\n",
       " ('机器学习', 1),\n",
       " ('爆品', 1),\n",
       " ('需求挖掘', 2),\n",
       " ('流程设计', 3),\n",
       " ('批发/零售', 1),\n",
       " ('财务产品', 1),\n",
       " ('玩具', 1),\n",
       " ('Visio', 2),\n",
       " ('架构设计', 1),\n",
       " ('新品上市', 1),\n",
       " ('新品开发', 1),\n",
       " ('物联网', 1),\n",
       " ('B端产品', 1),\n",
       " ('产品策划', 1),\n",
       " ('企业服务', 1),\n",
       " ('广告行业', 1),\n",
       " ('产品包装', 1),\n",
       " ('需求分析', 6),\n",
       " ('Xmind', 1),\n",
       " ('贸易/进出口', 1),\n",
       " ('旅游行业', 1),\n",
       " ('电商产品', 2),\n",
       " ('AI人工智能产品', 2),\n",
       " ('经销渠道管理', 1),\n",
       " ('智能硬件', 2),\n",
       " ('安全产品', 1),\n",
       " ('人工智能', 2),\n",
       " ('调度策略产品', 2),\n",
       " ('AIOT', 1),\n",
       " ('交易产品', 1),\n",
       " ('to B', 2),\n",
       " ('产品优化', 2),\n",
       " ('ERP产品', 3),\n",
       " ('消费者研究', 1),\n",
       " ('渠道管理', 1),\n",
       " ('数据标注', 1),\n",
       " ('推荐产品', 1),\n",
       " ('AI产品', 1),\n",
       " ('家电行业', 1),\n",
       " ('电子商务', 4),\n",
       " ('IT互联网', 2),\n",
       " ('市场分析', 1),\n",
       " ('休闲食品', 1),\n",
       " ('产品卖点', 1),\n",
       " ('产品设计', 10),\n",
       " ('竞品分析', 4),\n",
       " ('消费品', 2),\n",
       " ('爬虫', 1),\n",
       " ('to C', 1),\n",
       " ('供应链产品', 3),\n",
       " ('计算机软件', 1),\n",
       " ('硬件产品', 3),\n",
       " ('工具产品', 6),\n",
       " ('数据产品', 5),\n",
       " ('策略产品', 5),\n",
       " ('需求管理', 1),\n",
       " ('潮玩', 1),\n",
       " ('教育行业', 1),\n",
       " ('用户研究', 5),\n",
       " ('后台产品', 1),\n",
       " ('商品中心', 1),\n",
       " ('CRM产品', 2),\n",
       " ('需求确认', 1),\n",
       " ('硬件系统集成', 2),\n",
       " ('客户关系管理系统', 1),\n",
       " ('墨刀', 1),\n",
       " ('交通/运输/物流', 2),\n",
       " ('产品规划', 15),\n",
       " ('原型设计', 3),\n",
       " ('广告产品', 1),\n",
       " ('活动策划', 1),\n",
       " ('数据分析', 5),\n",
       " ('市场调研', 3),\n",
       " ('产品管理', 1),\n",
       " ('业务化建模', 1),\n",
       " ('产品企划', 1),\n",
       " ('内容产品', 1),\n",
       " ('风控产品', 1),\n",
       " ('CRM系统', 1),\n",
       " ('产品测试', 1),\n",
       " ('商业产品', 2),\n",
       " ('积木', 1),\n",
       " ('Axure', 2),\n",
       " ('安保行业', 1),\n",
       " ('平台产品', 2),\n",
       " ('中台产品', 2),\n",
       " ('ERP系统', 1),\n",
       " ('团队管理', 5),\n",
       " ('广告营销', 1)]"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 数据处理\n",
    "PM_labels_words = [(i,PM_labels_list.count(i)) for i in set(PM_labels_list)]\n",
    "PM_labels_words"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:47:10.753144Z",
     "iopub.status.busy": "2023-05-31T12:47:10.752462Z",
     "iopub.status.idle": "2023-05-31T12:47:10.759293Z",
     "shell.execute_reply": "2023-05-31T12:47:10.758454Z",
     "shell.execute_reply.started": "2023-05-31T12:47:10.753109Z"
    },
    "scrolled": true,
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([\"['中台产品', '爬虫']\",\n",
       "       \"['AI人工智能产品', '数据产品', '推荐产品', '策略产品', '工具产品', '人工智能', '团队管理', '产品规划']\",\n",
       "       \"['数据产品', '计算机软件', '企业服务', '产品设计', '竞品分析', '原型设计', '用户研究', '需求分析', '产品规划', '数据分析']\",\n",
       "       \"['新零售', '商品中心', '产品经理']\", \"['数据产品']\",\n",
       "       \"['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']\",\n",
       "       '[]', '[]',\n",
       "       \"['财务产品', '数据产品', '交易产品', '电子商务', '产品规划', '产品设计', '用户研究']\",\n",
       "       \"['调度策略产品', '交通/运输/物流', '物流快递', 'O2O', '需求挖掘', '产品设计', '数据分析']\",\n",
       "       '[]', \"['产品经理', '积木', '玩具', '潮玩', '产品企划', '市场分析', '产品规划', '爆品']\",\n",
       "       \"['ERP产品', '工具产品', 'ERP系统', 'IT互联网', '贸易/进出口', '消费品', '产品设计', '产品优化', '产品规划', '需求分析']\",\n",
       "       \"['广告产品', '商业产品', '策略产品', '广告行业', '广告营销', '旅游行业', '产品设计', '产品规划', '产品优化', '数据分析']\",\n",
       "       \"['产品规划', '电商产品', '供应链产品', 'CRM产品', 'ERP产品', '电子商务', '家电行业', '消费品', '批发/零售', 'to C']\",\n",
       "       '[]',\n",
       "       \"['数据产品', '平台产品', '工具产品', '人工智能', '产品设计', 'Axure', '流程设计', 'Visio', '墨刀', '产品规划']\",\n",
       "       \"['硬件产品', '商业产品', '策略产品', '硬件系统集成', '用户研究', '竞品分析', '产品规划', '市场调研', '团队管理']\",\n",
       "       \"['AI产品', '机器学习', '业务化建模', '数据标注']\",\n",
       "       \"['原型设计', '需求分析', '物联网', 'IOT', 'AIOT']\", '[]',\n",
       "       \"['需求分析', '产品经理', 'CRM产品', 'CRM系统', 'B端产品', '客户关系管理系统', '经销渠道管理']\",\n",
       "       '[]', '[]', '[]', \"['产品策划']\", \"['供应链产品', 'ERP产品', '后台产品', 'to B']\",\n",
       "       \"['策略产品', '产品规划', '市场调研']\", '[]',\n",
       "       \"['风控产品', '安全产品', '工具产品', '内容产品', '平台产品', '策略产品', '电商产品', '电子商务', '安保行业', 'IT互联网']\",\n",
       "       \"['AI人工智能产品', '硬件产品', '智能硬件', '竞品分析']\",\n",
       "       \"['休闲食品', '新品上市', '市场调研', '渠道分析', '消费者研究', '活动策划']\",\n",
       "       \"['用户研究', '产品规划', '数据分析']\",\n",
       "       \"['产品包装', '产品测试', '产品卖点', '渠道管理', '产品管理', '产品库存', '竞品分析', '产品规划', '包装规划', '新品开发']\",\n",
       "       \"['硬件产品', '智能硬件', '硬件系统集成', '教育行业']\",\n",
       "       \"['工具产品', '产品设计', '需求分析', '需求管理', '原型设计', '流程设计', '需求确认', '团队管理']\",\n",
       "       \"['产品设计', '架构设计', '供应链产品', '中台产品', '产品规划', '电子商务', 'to B', '需求分析', '流程设计']\",\n",
       "       '[]', \"['工具产品', '团队管理', '产品规划']\",\n",
       "       \"['产品规划', '产品设计', '团队管理', '用户研究', 'Xmind', 'Visio', 'Axure']\"],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['job.labels'].values"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 薪资-（平均薪资）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:07:40.313087Z",
     "iopub.status.busy": "2023-06-14T10:07:40.312402Z",
     "iopub.status.idle": "2023-06-14T10:07:40.348489Z",
     "shell.execute_reply": "2023-06-14T10:07:40.347427Z",
     "shell.execute_reply.started": "2023-06-14T10:07:40.313043Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位标签</th>\n",
       "      <th>职位更新时间</th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>是否top职位</th>\n",
       "      <th>工作年限</th>\n",
       "      <th>学历</th>\n",
       "      <th>公司融资情况</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>行业</th>\n",
       "      <th>规模</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...</td>\n",
       "      <td>20221118143443</td>\n",
       "      <td>产品经理 Product Manager</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>美股上市</td>\n",
       "      <td>金融壹账通</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品经理 (Senior) Product Manager</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品市场经理 Product Marketing Manager</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>['交易产品', '金融行业']</td>\n",
       "      <td>20221230112638</td>\n",
       "      <td>产品经理-海外交易柜台方向</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>中国国际金融股份有限公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>5000-10000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>[]</td>\n",
       "      <td>20220810153828</td>\n",
       "      <td>Product Manager-Film Capacitor/Polymer Capacitor</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>10年以上</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>伊顿中国</td>\n",
       "      <td>机械/设备</td>\n",
       "      <td>10000人以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>104</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>风险合规经理（离岸财富管理产品）</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>500-999人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106</th>\n",
       "      <td>['本科', '功能测试', '软件测试']</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>软件测试应届生（23届）</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>游戏</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>107</th>\n",
       "      <td>['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>APP测试工程师</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>游戏</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>Graduate Engineer (Civil and MEP Engineering)</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>109 rows × 12 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                  职位标签          职位更新时间  \\\n",
       "0    ['金融产品', '征信行业', '金融行业', '金融理财/贷款', '批发/零售', '...  20221118143443   \n",
       "1         ['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']  20230602174402   \n",
       "2                                                   []  20230602174402   \n",
       "3                                     ['交易产品', '金融行业']  20221230112638   \n",
       "4                                                   []  20220810153828   \n",
       "..                                                 ...             ...   \n",
       "104                                                 []  20230522113042   \n",
       "105                                             ['本科']  20210223134718   \n",
       "106                             ['本科', '功能测试', '软件测试']  20230613110233   \n",
       "107   ['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']  20230506100220   \n",
       "108                                             ['本科']  20230614100413   \n",
       "\n",
       "                                                   职位          薪资       地区  \\\n",
       "0                                产品经理 Product Manager        薪资面议   香港-观塘区   \n",
       "1                       产品经理 (Senior) Product Manager      25-40k   香港-观塘区   \n",
       "2                    产品市场经理 Product Marketing Manager      40-60k   香港-观塘区   \n",
       "3                                       产品经理-海外交易柜台方向        薪资面议   香港-中西区   \n",
       "4    Product Manager-Film Capacitor/Polymer Capacitor        薪资面议    香港-东区   \n",
       "..                                                ...         ...      ...   \n",
       "104                                  风险合规经理（离岸财富管理产品）  40-70k·18薪       香港   \n",
       "105                                              产品经理      12-25k   香港-湾仔区   \n",
       "106                                      软件测试应届生（23届）      20-25k       香港   \n",
       "107                                          APP测试工程师      20-25k    香港-东区   \n",
       "108     Graduate Engineer (Civil and MEP Engineering)      20-21k  香港-油尖旺区   \n",
       "\n",
       "     是否top职位   工作年限     学历  公司融资情况                           公司名称        行业  \\\n",
       "0      False   3-5年   统招本科    美股上市                          金融壹账通      科技金融   \n",
       "1      False  5-10年     本科     NaN  KPay merchant service limited      科技金融   \n",
       "2      False   3-5年     本科     NaN  KPay merchant service limited      科技金融   \n",
       "3      False  5-10年     硕士  沪深A股上市                   中国国际金融股份有限公司  基金/证券/期货   \n",
       "4      False  10年以上   统招本科     NaN                           伊顿中国     机械/设备   \n",
       "..       ...    ...    ...     ...                            ...       ...   \n",
       "104    False  5-10年  硕士及以上   融资未公开                     某公募基金理财子公司  基金/证券/投资   \n",
       "105    False    NaN    NaN     NaN                     华润数科控股有限公司      人工智能   \n",
       "106    False    NaN    NaN   融资未公开                   成都无敌勇士科技有限公司        游戏   \n",
       "107    False    NaN    NaN     NaN                  Winner Studio        游戏   \n",
       "108    False    NaN    NaN     NaN                           阿特金斯   房地产开发经营   \n",
       "\n",
       "              规模  \n",
       "0     2000-5000人  \n",
       "1         50-99人  \n",
       "2         50-99人  \n",
       "3    5000-10000人  \n",
       "4       10000人以上  \n",
       "..           ...  \n",
       "104     500-999人  \n",
       "105   2000-5000人  \n",
       "106     100-499人  \n",
       "107          NaN  \n",
       "108     100-499人  \n",
       "\n",
       "[109 rows x 12 columns]"
      ]
     },
     "execution_count": 48,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# columns 重命名\r\n",
    "df_PM_gz = df_PM_gz.rename(columns={\r\n",
    "    'job.labels':'职位标签',\r\n",
    "    'job.refreshTime':'职位更新时间',\r\n",
    "    'job.title':'职位',\r\n",
    "    'job.salary':'薪资',\r\n",
    "    'job.dq':'地区',\r\n",
    "    'job.topJob':'是否top职位',\r\n",
    "    'job.requireWorkYears':'工作年限',\r\n",
    "    'job.requireEduLevel':'学历',\r\n",
    "    'comp.compStage':'公司融资情况',\r\n",
    "    'comp.compName':'公司名称',\r\n",
    "    'comp.compIndustry':'行业',\r\n",
    "    'comp.compScale':'规模'\r\n",
    "})\r\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:07:58.546404Z",
     "iopub.status.busy": "2023-06-14T10:07:58.545896Z",
     "iopub.status.idle": "2023-06-14T10:07:58.569344Z",
     "shell.execute_reply": "2023-06-14T10:07:58.568600Z",
     "shell.execute_reply.started": "2023-06-14T10:07:58.546372Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位标签</th>\n",
       "      <th>职位更新时间</th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>是否top职位</th>\n",
       "      <th>工作年限</th>\n",
       "      <th>学历</th>\n",
       "      <th>公司融资情况</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>行业</th>\n",
       "      <th>规模</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品经理 (Senior) Product Manager</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品市场经理 Product Marketing Manager</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230206145433</td>\n",
       "      <td>Product Manager - Transaction</td>\n",
       "      <td>40-70k</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>C轮</td>\n",
       "      <td>多点生活(中国)网络科技有限公司</td>\n",
       "      <td>电子商务</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230331182809</td>\n",
       "      <td>Product Manager (AD to Dir)</td>\n",
       "      <td>30-60k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>已上市</td>\n",
       "      <td>某国内基金证券上市公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230413145802</td>\n",
       "      <td>Product Manager (AD to Dir)</td>\n",
       "      <td>30-55k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>已上市</td>\n",
       "      <td>某国内基金/证券/期货上市公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>104</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>风险合规经理（离岸财富管理产品）</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>500-999人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>2000-5000人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106</th>\n",
       "      <td>['本科', '功能测试', '软件测试']</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>软件测试应届生（23届）</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>游戏</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>107</th>\n",
       "      <td>['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>APP测试工程师</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>游戏</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>Graduate Engineer (Civil and MEP Engineering)</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>100-499人</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>88 rows × 12 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 职位标签          职位更新时间  \\\n",
       "1        ['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']  20230602174402   \n",
       "2                                                  []  20230602174402   \n",
       "5                                                  []  20230206145433   \n",
       "6                                                  []  20230331182809   \n",
       "7                                                  []  20230413145802   \n",
       "..                                                ...             ...   \n",
       "104                                                []  20230522113042   \n",
       "105                                            ['本科']  20210223134718   \n",
       "106                            ['本科', '功能测试', '软件测试']  20230613110233   \n",
       "107  ['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']  20230506100220   \n",
       "108                                            ['本科']  20230614100413   \n",
       "\n",
       "                                                职位          薪资       地区  \\\n",
       "1                    产品经理 (Senior) Product Manager      25-40k   香港-观塘区   \n",
       "2                 产品市场经理 Product Marketing Manager      40-60k   香港-观塘区   \n",
       "5                    Product Manager - Transaction      40-70k   香港-中西区   \n",
       "6                      Product Manager (AD to Dir)      30-60k       香港   \n",
       "7                      Product Manager (AD to Dir)      30-55k       香港   \n",
       "..                                             ...         ...      ...   \n",
       "104                               风险合规经理（离岸财富管理产品）  40-70k·18薪       香港   \n",
       "105                                           产品经理      12-25k   香港-湾仔区   \n",
       "106                                   软件测试应届生（23届）      20-25k       香港   \n",
       "107                                       APP测试工程师      20-25k    香港-东区   \n",
       "108  Graduate Engineer (Civil and MEP Engineering)      20-21k  香港-油尖旺区   \n",
       "\n",
       "     是否top职位   工作年限     学历 公司融资情况                           公司名称        行业  \\\n",
       "1      False  5-10年     本科    NaN  KPay merchant service limited      科技金融   \n",
       "2      False   3-5年     本科    NaN  KPay merchant service limited      科技金融   \n",
       "5      False  5-10年     本科     C轮               多点生活(中国)网络科技有限公司      电子商务   \n",
       "6      False  5-10年  本科及以上    已上市                    某国内基金证券上市公司  基金/证券/期货   \n",
       "7      False  5-10年   学历不限    已上市                某国内基金/证券/期货上市公司  基金/证券/期货   \n",
       "..       ...    ...    ...    ...                            ...       ...   \n",
       "104    False  5-10年  硕士及以上  融资未公开                     某公募基金理财子公司  基金/证券/投资   \n",
       "105    False    NaN    NaN    NaN                     华润数科控股有限公司      人工智能   \n",
       "106    False    NaN    NaN  融资未公开                   成都无敌勇士科技有限公司        游戏   \n",
       "107    False    NaN    NaN    NaN                  Winner Studio        游戏   \n",
       "108    False    NaN    NaN    NaN                           阿特金斯   房地产开发经营   \n",
       "\n",
       "             规模  \n",
       "1        50-99人  \n",
       "2        50-99人  \n",
       "5    2000-5000人  \n",
       "6           NaN  \n",
       "7           NaN  \n",
       "..          ...  \n",
       "104    500-999人  \n",
       "105  2000-5000人  \n",
       "106    100-499人  \n",
       "107         NaN  \n",
       "108    100-499人  \n",
       "\n",
       "[88 rows x 12 columns]"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "非薪资面议 = df_PM_gz [ ~df_PM_gz['薪资'].str.contains(\"面议|元/天\")]\r\n",
    "非薪资面议"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:08:10.656445Z",
     "iopub.status.busy": "2023-06-14T10:08:10.655807Z",
     "iopub.status.idle": "2023-06-14T10:08:10.665916Z",
     "shell.execute_reply": "2023-06-14T10:08:10.665090Z",
     "shell.execute_reply.started": "2023-06-14T10:08:10.656414Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[['25-40k'],\n",
       " ['40-60k'],\n",
       " ['40-70k'],\n",
       " ['30-60k'],\n",
       " ['30-55k'],\n",
       " ['50-55k'],\n",
       " ['14-40k', '14'],\n",
       " ['45-75k', '15'],\n",
       " ['25-30k'],\n",
       " ['35-65k'],\n",
       " ['35-65k'],\n",
       " ['15-25k'],\n",
       " ['50-80k'],\n",
       " ['20-30k'],\n",
       " ['120-240k', '30'],\n",
       " ['30-50k'],\n",
       " ['30-45k'],\n",
       " ['20-40k', '15'],\n",
       " ['22-30k'],\n",
       " ['30-60k'],\n",
       " ['35-65k'],\n",
       " ['40-50k'],\n",
       " ['20-30k'],\n",
       " ['30-50k'],\n",
       " ['25-45k'],\n",
       " ['30-40k', '20'],\n",
       " ['30-45k'],\n",
       " ['15-30k', '14'],\n",
       " ['35-40k'],\n",
       " ['35-55k'],\n",
       " ['20-45k'],\n",
       " ['25-30k', '13'],\n",
       " ['15-30k'],\n",
       " ['20-35k', '15'],\n",
       " ['1-2k'],\n",
       " ['70-100k', '16'],\n",
       " ['60-90k', '16'],\n",
       " ['70-100k', '22'],\n",
       " ['30-50k'],\n",
       " ['15-25k'],\n",
       " ['15-25k'],\n",
       " ['35-55k'],\n",
       " ['15-16k'],\n",
       " ['15-30k', '13'],\n",
       " ['50-80k'],\n",
       " ['60-90k', '15'],\n",
       " ['85-100k', '24'],\n",
       " ['15-30k'],\n",
       " ['25-40k', '15'],\n",
       " ['40-50k'],\n",
       " ['70-100k'],\n",
       " ['30-60k'],\n",
       " ['70-100k', '16'],\n",
       " ['18-25k'],\n",
       " ['30-60k', '24'],\n",
       " ['40-60k'],\n",
       " ['30-40k', '16'],\n",
       " ['40-70k'],\n",
       " ['25-30k'],\n",
       " ['15-30k'],\n",
       " ['30-35k'],\n",
       " ['20-30k'],\n",
       " ['30-50k', '16'],\n",
       " ['3-5k', '15'],\n",
       " ['12-24k'],\n",
       " ['15-30k'],\n",
       " ['30-40k'],\n",
       " ['15-30k'],\n",
       " ['10-16k'],\n",
       " ['29-50k', '16'],\n",
       " ['25-30k'],\n",
       " ['20-35k', '15'],\n",
       " ['40-70k'],\n",
       " ['40-60k', '13'],\n",
       " ['14-18k', '13'],\n",
       " ['15-30k', '14'],\n",
       " ['32-37k'],\n",
       " ['30-60k'],\n",
       " ['13-18k', '13'],\n",
       " ['30-35k'],\n",
       " ['40-70k'],\n",
       " ['45-55k'],\n",
       " ['70-100k'],\n",
       " ['40-70k', '18'],\n",
       " ['12-25k'],\n",
       " ['20-25k'],\n",
       " ['20-25k'],\n",
       " ['20-21k']]"
      ]
     },
     "execution_count": 50,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "非薪资面议_detail = 非薪资面议['薪资'].apply(lambda x:x.split('薪')[0].split('·')).tolist()\r\n",
    "非薪资面议_detail"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:08:28.362691Z",
     "iopub.status.busy": "2023-06-14T10:08:28.361977Z",
     "iopub.status.idle": "2023-06-14T10:08:28.367328Z",
     "shell.execute_reply": "2023-06-14T10:08:28.366657Z",
     "shell.execute_reply.started": "2023-06-14T10:08:28.362660Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "13.541666666666666"
      ]
     },
     "execution_count": 51,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(10+15)/2*13/12"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:08:37.239603Z",
     "iopub.status.busy": "2023-06-14T10:08:37.238591Z",
     "iopub.status.idle": "2023-06-14T10:08:37.246976Z",
     "shell.execute_reply": "2023-06-14T10:08:37.246315Z",
     "shell.execute_reply.started": "2023-06-14T10:08:37.239561Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[32.5,\n",
       " 50.0,\n",
       " 55.0,\n",
       " 45.0,\n",
       " 42.5,\n",
       " 52.5,\n",
       " 31.5,\n",
       " 75.0,\n",
       " 27.5,\n",
       " 50.0,\n",
       " 50.0,\n",
       " 20.0,\n",
       " 65.0,\n",
       " 25.0,\n",
       " 450.0,\n",
       " 40.0,\n",
       " 37.5,\n",
       " 37.5,\n",
       " 26.0,\n",
       " 45.0,\n",
       " 50.0,\n",
       " 45.0,\n",
       " 25.0,\n",
       " 40.0,\n",
       " 35.0,\n",
       " 58.3,\n",
       " 37.5,\n",
       " 26.2,\n",
       " 37.5,\n",
       " 45.0,\n",
       " 32.5,\n",
       " 29.8,\n",
       " 22.5,\n",
       " 34.4,\n",
       " 1.5,\n",
       " 113.3,\n",
       " 100.0,\n",
       " 155.8,\n",
       " 40.0,\n",
       " 20.0,\n",
       " 20.0,\n",
       " 45.0,\n",
       " 15.5,\n",
       " 24.4,\n",
       " 65.0,\n",
       " 93.8,\n",
       " 185.0,\n",
       " 22.5,\n",
       " 40.6,\n",
       " 45.0,\n",
       " 85.0,\n",
       " 45.0,\n",
       " 113.3,\n",
       " 21.5,\n",
       " 90.0,\n",
       " 50.0,\n",
       " 46.7,\n",
       " 55.0,\n",
       " 27.5,\n",
       " 22.5,\n",
       " 32.5,\n",
       " 25.0,\n",
       " 53.3,\n",
       " 5.0,\n",
       " 18.0,\n",
       " 22.5,\n",
       " 35.0,\n",
       " 22.5,\n",
       " 13.0,\n",
       " 52.7,\n",
       " 27.5,\n",
       " 34.4,\n",
       " 55.0,\n",
       " 54.2,\n",
       " 17.3,\n",
       " 26.2,\n",
       " 34.5,\n",
       " 45.0,\n",
       " 16.8,\n",
       " 32.5,\n",
       " 55.0,\n",
       " 50.0,\n",
       " 85.0,\n",
       " 82.5,\n",
       " 18.5,\n",
       " 22.5,\n",
       " 22.5,\n",
       " 20.5]"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "平均薪资 = [ (int(i[0].split('-')[0]) +int(i[0].split('-')[1].split('k')[0]))/2    \\\r\n",
    " if len(i)==1 else round((int(i[0].split('-')[0]) +int(i[0].split('-')[1].split('k')[0]))/2*int(i[1])/12,1)     \\\r\n",
    " for i in 非薪资面议_detail        ] \r\n",
    "平均薪资"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:08:57.329199Z",
     "iopub.status.busy": "2023-06-14T10:08:57.328109Z",
     "iopub.status.idle": "2023-06-14T10:08:57.334605Z",
     "shell.execute_reply": "2023-06-14T10:08:57.333725Z",
     "shell.execute_reply.started": "2023-06-14T10:08:57.329150Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "88"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(平均薪资)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:09:11.469328Z",
     "iopub.status.busy": "2023-06-14T10:09:11.468460Z",
     "iopub.status.idle": "2023-06-14T10:09:11.474445Z",
     "shell.execute_reply": "2023-06-14T10:09:11.473724Z",
     "shell.execute_reply.started": "2023-06-14T10:09:11.469295Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/opt/conda/envs/python35-paddle120-env/lib/python3.7/site-packages/ipykernel_launcher.py:1: SettingWithCopyWarning: \r\n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\r\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\r\n",
      "\r\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\r\n",
      "  \"\"\"Entry point for launching an IPython kernel.\r\n"
     ]
    }
   ],
   "source": [
    "非薪资面议['平均薪资']=平均薪资"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:10:28.946507Z",
     "iopub.status.busy": "2023-06-14T10:10:28.945582Z",
     "iopub.status.idle": "2023-06-14T10:10:28.970157Z",
     "shell.execute_reply": "2023-06-14T10:10:28.969336Z",
     "shell.execute_reply.started": "2023-06-14T10:10:28.946475Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位标签</th>\n",
       "      <th>职位更新时间</th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>是否top职位</th>\n",
       "      <th>工作年限</th>\n",
       "      <th>学历</th>\n",
       "      <th>公司融资情况</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>行业</th>\n",
       "      <th>规模</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品经理 (Senior) Product Manager</td>\n",
       "      <td>25-40k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>32.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230602174402</td>\n",
       "      <td>产品市场经理 Product Marketing Manager</td>\n",
       "      <td>40-60k</td>\n",
       "      <td>香港-观塘区</td>\n",
       "      <td>False</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>KPay merchant service limited</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>50.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230206145433</td>\n",
       "      <td>Product Manager - Transaction</td>\n",
       "      <td>40-70k</td>\n",
       "      <td>香港-中西区</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科</td>\n",
       "      <td>C轮</td>\n",
       "      <td>多点生活(中国)网络科技有限公司</td>\n",
       "      <td>电子商务</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>55.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230331182809</td>\n",
       "      <td>Product Manager (AD to Dir)</td>\n",
       "      <td>30-60k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>已上市</td>\n",
       "      <td>某国内基金证券上市公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "      <td>45.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230413145802</td>\n",
       "      <td>Product Manager (AD to Dir)</td>\n",
       "      <td>30-55k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>已上市</td>\n",
       "      <td>某国内基金/证券/期货上市公司</td>\n",
       "      <td>基金/证券/期货</td>\n",
       "      <td>NaN</td>\n",
       "      <td>42.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>104</th>\n",
       "      <td>[]</td>\n",
       "      <td>20230522113042</td>\n",
       "      <td>风险合规经理（离岸财富管理产品）</td>\n",
       "      <td>40-70k·18薪</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>某公募基金理财子公司</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>82.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20210223134718</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>12-25k</td>\n",
       "      <td>香港-湾仔区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>华润数科控股有限公司</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>18.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106</th>\n",
       "      <td>['本科', '功能测试', '软件测试']</td>\n",
       "      <td>20230613110233</td>\n",
       "      <td>软件测试应届生（23届）</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>成都无敌勇士科技有限公司</td>\n",
       "      <td>游戏</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>22.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>107</th>\n",
       "      <td>['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']</td>\n",
       "      <td>20230506100220</td>\n",
       "      <td>APP测试工程师</td>\n",
       "      <td>20-25k</td>\n",
       "      <td>香港-东区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>Winner Studio</td>\n",
       "      <td>游戏</td>\n",
       "      <td>NaN</td>\n",
       "      <td>22.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108</th>\n",
       "      <td>['本科']</td>\n",
       "      <td>20230614100413</td>\n",
       "      <td>Graduate Engineer (Civil and MEP Engineering)</td>\n",
       "      <td>20-21k</td>\n",
       "      <td>香港-油尖旺区</td>\n",
       "      <td>False</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>阿特金斯</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>20.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>88 rows × 13 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 职位标签          职位更新时间  \\\n",
       "1        ['IT互联网', 'SaaS产品', 'to B', '产品设计', '移动端产品']  20230602174402   \n",
       "2                                                  []  20230602174402   \n",
       "5                                                  []  20230206145433   \n",
       "6                                                  []  20230331182809   \n",
       "7                                                  []  20230413145802   \n",
       "..                                                ...             ...   \n",
       "104                                                []  20230522113042   \n",
       "105                                            ['本科']  20210223134718   \n",
       "106                            ['本科', '功能测试', '软件测试']  20230613110233   \n",
       "107  ['本科', '软件测试', '应用测试', '功能测试', 'iOS', 'Android']  20230506100220   \n",
       "108                                            ['本科']  20230614100413   \n",
       "\n",
       "                                                职位          薪资       地区  \\\n",
       "1                    产品经理 (Senior) Product Manager      25-40k   香港-观塘区   \n",
       "2                 产品市场经理 Product Marketing Manager      40-60k   香港-观塘区   \n",
       "5                    Product Manager - Transaction      40-70k   香港-中西区   \n",
       "6                      Product Manager (AD to Dir)      30-60k       香港   \n",
       "7                      Product Manager (AD to Dir)      30-55k       香港   \n",
       "..                                             ...         ...      ...   \n",
       "104                               风险合规经理（离岸财富管理产品）  40-70k·18薪       香港   \n",
       "105                                           产品经理      12-25k   香港-湾仔区   \n",
       "106                                   软件测试应届生（23届）      20-25k       香港   \n",
       "107                                       APP测试工程师      20-25k    香港-东区   \n",
       "108  Graduate Engineer (Civil and MEP Engineering)      20-21k  香港-油尖旺区   \n",
       "\n",
       "     是否top职位   工作年限     学历 公司融资情况                           公司名称        行业  \\\n",
       "1      False  5-10年     本科    NaN  KPay merchant service limited      科技金融   \n",
       "2      False   3-5年     本科    NaN  KPay merchant service limited      科技金融   \n",
       "5      False  5-10年     本科     C轮               多点生活(中国)网络科技有限公司      电子商务   \n",
       "6      False  5-10年  本科及以上    已上市                    某国内基金证券上市公司  基金/证券/期货   \n",
       "7      False  5-10年   学历不限    已上市                某国内基金/证券/期货上市公司  基金/证券/期货   \n",
       "..       ...    ...    ...    ...                            ...       ...   \n",
       "104    False  5-10年  硕士及以上  融资未公开                     某公募基金理财子公司  基金/证券/投资   \n",
       "105    False    NaN    NaN    NaN                     华润数科控股有限公司      人工智能   \n",
       "106    False    NaN    NaN  融资未公开                   成都无敌勇士科技有限公司        游戏   \n",
       "107    False    NaN    NaN    NaN                  Winner Studio        游戏   \n",
       "108    False    NaN    NaN    NaN                           阿特金斯   房地产开发经营   \n",
       "\n",
       "             规模  平均薪资  \n",
       "1        50-99人  32.5  \n",
       "2        50-99人  50.0  \n",
       "5    2000-5000人  55.0  \n",
       "6           NaN  45.0  \n",
       "7           NaN  42.5  \n",
       "..          ...   ...  \n",
       "104    500-999人  82.5  \n",
       "105  2000-5000人  18.5  \n",
       "106    100-499人  22.5  \n",
       "107         NaN  22.5  \n",
       "108    100-499人  20.5  \n",
       "\n",
       "[88 rows x 13 columns]"
      ]
     },
     "execution_count": 55,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "非薪资面议"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:10:50.204677Z",
     "iopub.status.busy": "2023-06-14T10:10:50.203707Z",
     "iopub.status.idle": "2023-06-14T10:10:50.217601Z",
     "shell.execute_reply": "2023-06-14T10:10:50.216579Z",
     "shell.execute_reply.started": "2023-06-14T10:10:50.204644Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>地区</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>香港</th>\n",
       "      <td>45.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-东区</th>\n",
       "      <td>55.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-中西区</th>\n",
       "      <td>55.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-九龙城区</th>\n",
       "      <td>54.20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-元朗区</th>\n",
       "      <td>17.05</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-沙田区</th>\n",
       "      <td>26.20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-油尖旺区</th>\n",
       "      <td>24.40</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-深水埗区</th>\n",
       "      <td>32.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-湾仔区</th>\n",
       "      <td>35.95</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-荃湾区</th>\n",
       "      <td>65.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-葵青区</th>\n",
       "      <td>26.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-西贡区</th>\n",
       "      <td>35.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>香港-观塘区</th>\n",
       "      <td>50.00</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          平均薪资\n",
       "地区            \n",
       "香港       45.00\n",
       "香港-东区    55.00\n",
       "香港-中西区   55.00\n",
       "香港-九龙城区  54.20\n",
       "香港-元朗区   17.05\n",
       "香港-沙田区   26.20\n",
       "香港-油尖旺区  24.40\n",
       "香港-深水埗区  32.50\n",
       "香港-湾仔区   35.95\n",
       "香港-荃湾区   65.00\n",
       "香港-葵青区   26.75\n",
       "香港-西贡区   35.00\n",
       "香港-观塘区   50.00"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 分地区平均薪资\r\n",
    "分地区_平均薪资 = 非薪资面议.groupby('地区').agg({'平均薪资':'median'})\r\n",
    "分地区_平均薪资"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:11:04.685089Z",
     "iopub.status.busy": "2023-06-14T10:11:04.684457Z",
     "iopub.status.idle": "2023-06-14T10:11:04.691665Z",
     "shell.execute_reply": "2023-06-14T10:11:04.690593Z",
     "shell.execute_reply.started": "2023-06-14T10:11:04.685057Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['香港',\n",
       " '香港-东区',\n",
       " '香港-中西区',\n",
       " '香港-九龙城区',\n",
       " '香港-元朗区',\n",
       " '香港-沙田区',\n",
       " '香港-油尖旺区',\n",
       " '香港-深水埗区',\n",
       " '香港-湾仔区',\n",
       " '香港-荃湾区',\n",
       " '香港-葵青区',\n",
       " '香港-西贡区',\n",
       " '香港-观塘区']"
      ]
     },
     "execution_count": 57,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "分地区_平均薪资_index = 分地区_平均薪资.index.tolist()\r\n",
    "分地区_平均薪资_index"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-05-31T12:49:38.320051Z",
     "iopub.status.busy": "2023-05-31T12:49:38.319395Z",
     "iopub.status.idle": "2023-05-31T12:49:38.329927Z",
     "shell.execute_reply": "2023-05-31T12:49:38.329058Z",
     "shell.execute_reply.started": "2023-05-31T12:49:38.320016Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "<script>\n",
       "    require.config({\n",
       "        paths: {\n",
       "            'echarts':'https://assets.pyecharts.org/assets/v5/echarts.min'\n",
       "        }\n",
       "    });\n",
       "</script>\n",
       "\n",
       "        <div id=\"b11ef788263b4c649c6e902474e0d438\" style=\"width:900px; height:500px;\"></div>\n",
       "\n",
       "<script>\n",
       "        require(['echarts'], function(echarts) {\n",
       "                var chart_b11ef788263b4c649c6e902474e0d438 = echarts.init(\n",
       "                    document.getElementById('b11ef788263b4c649c6e902474e0d438'), 'white', {renderer: 'canvas'});\n",
       "                var option_b11ef788263b4c649c6e902474e0d438 = {\n",
       "    \"animation\": true,\n",
       "    \"animationThreshold\": 2000,\n",
       "    \"animationDuration\": 1000,\n",
       "    \"animationEasing\": \"cubicOut\",\n",
       "    \"animationDelay\": 0,\n",
       "    \"animationDurationUpdate\": 300,\n",
       "    \"animationEasingUpdate\": \"cubicOut\",\n",
       "    \"animationDelayUpdate\": 0,\n",
       "    \"aria\": {\n",
       "        \"enabled\": false\n",
       "    },\n",
       "    \"color\": [\n",
       "        \"#5470c6\",\n",
       "        \"#91cc75\",\n",
       "        \"#fac858\",\n",
       "        \"#ee6666\",\n",
       "        \"#73c0de\",\n",
       "        \"#3ba272\",\n",
       "        \"#fc8452\",\n",
       "        \"#9a60b4\",\n",
       "        \"#ea7ccc\"\n",
       "    ],\n",
       "    \"series\": [\n",
       "        {\n",
       "            \"type\": \"bar\",\n",
       "            \"name\": \"\\u5730\\u533a\",\n",
       "            \"legendHoverLink\": true,\n",
       "            \"data\": [\n",
       "                42.5,\n",
       "                20.8,\n",
       "                20.0,\n",
       "                24.0,\n",
       "                20.5,\n",
       "                27.5,\n",
       "                17.5,\n",
       "                27.5\n",
       "            ],\n",
       "            \"realtimeSort\": false,\n",
       "            \"showBackground\": false,\n",
       "            \"stackStrategy\": \"samesign\",\n",
       "            \"cursor\": \"pointer\",\n",
       "            \"barMinHeight\": 0,\n",
       "            \"barCategoryGap\": \"20%\",\n",
       "            \"barGap\": \"30%\",\n",
       "            \"large\": false,\n",
       "            \"largeThreshold\": 400,\n",
       "            \"seriesLayoutBy\": \"column\",\n",
       "            \"datasetIndex\": 0,\n",
       "            \"clip\": true,\n",
       "            \"zlevel\": 0,\n",
       "            \"z\": 2,\n",
       "            \"label\": {\n",
       "                \"show\": true,\n",
       "                \"margin\": 8\n",
       "            }\n",
       "        }\n",
       "    ],\n",
       "    \"legend\": [\n",
       "        {\n",
       "            \"data\": [\n",
       "                \"\\u5730\\u533a\"\n",
       "            ],\n",
       "            \"selected\": {},\n",
       "            \"show\": true,\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"itemWidth\": 25,\n",
       "            \"itemHeight\": 14,\n",
       "            \"backgroundColor\": \"transparent\",\n",
       "            \"borderColor\": \"#ccc\",\n",
       "            \"borderWidth\": 1,\n",
       "            \"borderRadius\": 0,\n",
       "            \"pageButtonItemGap\": 5,\n",
       "            \"pageButtonPosition\": \"end\",\n",
       "            \"pageFormatter\": \"{current}/{total}\",\n",
       "            \"pageIconColor\": \"#2f4554\",\n",
       "            \"pageIconInactiveColor\": \"#aaa\",\n",
       "            \"pageIconSize\": 15,\n",
       "            \"animationDurationUpdate\": 800,\n",
       "            \"selector\": false,\n",
       "            \"selectorPosition\": \"auto\",\n",
       "            \"selectorItemGap\": 7,\n",
       "            \"selectorButtonGap\": 10\n",
       "        }\n",
       "    ],\n",
       "    \"tooltip\": {\n",
       "        \"show\": true,\n",
       "        \"trigger\": \"item\",\n",
       "        \"triggerOn\": \"mousemove|click\",\n",
       "        \"axisPointer\": {\n",
       "            \"type\": \"line\"\n",
       "        },\n",
       "        \"showContent\": true,\n",
       "        \"alwaysShowContent\": false,\n",
       "        \"showDelay\": 0,\n",
       "        \"hideDelay\": 100,\n",
       "        \"enterable\": false,\n",
       "        \"confine\": false,\n",
       "        \"appendToBody\": false,\n",
       "        \"transitionDuration\": 0.4,\n",
       "        \"textStyle\": {\n",
       "            \"fontSize\": 14\n",
       "        },\n",
       "        \"borderWidth\": 0,\n",
       "        \"padding\": 5,\n",
       "        \"order\": \"seriesAsc\"\n",
       "    },\n",
       "    \"xAxis\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"scale\": false,\n",
       "            \"nameLocation\": \"end\",\n",
       "            \"nameGap\": 15,\n",
       "            \"gridIndex\": 0,\n",
       "            \"inverse\": false,\n",
       "            \"offset\": 0,\n",
       "            \"splitNumber\": 5,\n",
       "            \"minInterval\": 0,\n",
       "            \"splitLine\": {\n",
       "                \"show\": true,\n",
       "                \"lineStyle\": {\n",
       "                    \"show\": true,\n",
       "                    \"width\": 1,\n",
       "                    \"opacity\": 1,\n",
       "                    \"curveness\": 0,\n",
       "                    \"type\": \"solid\"\n",
       "                }\n",
       "            },\n",
       "            \"data\": [\n",
       "                \"\\u5357\\u6c99\\u533a\",\n",
       "                \"\\u5929\\u6cb3\\u533a\",\n",
       "                \"\\u6d77\\u73e0\\u533a\",\n",
       "                \"\\u756a\\u79ba\\u533a\",\n",
       "                \"\\u767d\\u4e91\\u533a\",\n",
       "                \"\\u8354\\u6e7e\\u533a\",\n",
       "                \"\\u8d8a\\u79c0\\u533a\",\n",
       "                \"\\u9ec4\\u57d4\\u533a\"\n",
       "            ]\n",
       "        }\n",
       "    ],\n",
       "    \"yAxis\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"scale\": false,\n",
       "            \"nameLocation\": \"end\",\n",
       "            \"nameGap\": 15,\n",
       "            \"gridIndex\": 0,\n",
       "            \"inverse\": false,\n",
       "            \"offset\": 0,\n",
       "            \"splitNumber\": 5,\n",
       "            \"minInterval\": 0,\n",
       "            \"splitLine\": {\n",
       "                \"show\": true,\n",
       "                \"lineStyle\": {\n",
       "                    \"show\": true,\n",
       "                    \"width\": 1,\n",
       "                    \"opacity\": 1,\n",
       "                    \"curveness\": 0,\n",
       "                    \"type\": \"solid\"\n",
       "                }\n",
       "            }\n",
       "        }\n",
       "    ],\n",
       "    \"title\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"text\": \"PM-\\u5206\\u5730\\u533a-\\u4e2d\\u4f4d\\u6570\\u85aa\\u8d44\",\n",
       "            \"target\": \"blank\",\n",
       "            \"subtarget\": \"blank\",\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"textAlign\": \"auto\",\n",
       "            \"textVerticalAlign\": \"auto\",\n",
       "            \"triggerEvent\": false\n",
       "        }\n",
       "    ],\n",
       "    \"brush\": {\n",
       "        \"toolbox\": [\n",
       "            \"rect\",\n",
       "            \"polygon\",\n",
       "            \"keep\",\n",
       "            \"clear\"\n",
       "        ],\n",
       "        \"brushType\": \"rect\",\n",
       "        \"brushMode\": \"single\",\n",
       "        \"transformable\": true,\n",
       "        \"brushStyle\": {\n",
       "            \"borderWidth\": 1,\n",
       "            \"color\": \"rgba(120,140,180,0.3)\",\n",
       "            \"borderColor\": \"rgba(120,140,180,0.8)\"\n",
       "        },\n",
       "        \"throttleType\": \"fixRate\",\n",
       "        \"throttleDelay\": 0,\n",
       "        \"removeOnClick\": true,\n",
       "        \"z\": 10000\n",
       "    }\n",
       "};\n",
       "                chart_b11ef788263b4c649c6e902474e0d438.setOption(option_b11ef788263b4c649c6e902474e0d438);\n",
       "        });\n",
       "    </script>\n"
      ],
      "text/plain": [
       "<pyecharts.render.display.HTML at 0x7fa35932dd50>"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from pyecharts import options as opts\n",
    "from pyecharts.charts import Bar\n",
    "from pyecharts.faker import Faker\n",
    "\n",
    "\n",
    "c = (\n",
    "    Bar()\n",
    "    .add_xaxis([i.split('-')[1] for i in 分地区_平均薪资_index[1:]])\n",
    "    .add_yaxis(\"地区\", 分地区_平均薪资_values[1:])\n",
    "    .set_global_opts(\n",
    "        title_opts=opts.TitleOpts(title=\"PM-分地区-中位数薪资\"),\n",
    "        brush_opts=opts.BrushOpts(),\n",
    "    )\n",
    "    # .render(\"bar_with_brush.html\")\n",
    ")\n",
    "c.render_notebook()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:17:42.511789Z",
     "iopub.status.busy": "2023-06-14T10:17:42.511259Z",
     "iopub.status.idle": "2023-06-14T10:17:42.524614Z",
     "shell.execute_reply": "2023-06-14T10:17:42.523762Z",
     "shell.execute_reply.started": "2023-06-14T10:17:42.511756Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>工作年限</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1-3年</th>\n",
       "      <td>22.800000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10年以上</th>\n",
       "      <td>58.700000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3-5年</th>\n",
       "      <td>40.716000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5-10年</th>\n",
       "      <td>49.361111</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>经验不限</th>\n",
       "      <td>76.557143</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "            平均薪资\n",
       "工作年限            \n",
       "1-3年   22.800000\n",
       "10年以上  58.700000\n",
       "3-5年   40.716000\n",
       "5-10年  49.361111\n",
       "经验不限   76.557143"
      ]
     },
     "execution_count": 59,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_year_salary = 非薪资面议.groupby('工作年限').agg({'平均薪资':'mean'})\r\n",
    "df_year_salary"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:18:00.492046Z",
     "iopub.status.busy": "2023-06-14T10:18:00.491509Z",
     "iopub.status.idle": "2023-06-14T10:18:00.506731Z",
     "shell.execute_reply": "2023-06-14T10:18:00.505948Z",
     "shell.execute_reply.started": "2023-06-14T10:18:00.492015Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>工作年限</th>\n",
       "      <th>学历</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1-3年</th>\n",
       "      <th>本科</th>\n",
       "      <td>22.800000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">10年以上</th>\n",
       "      <th>本科及以上</th>\n",
       "      <td>64.900000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>统招本科</th>\n",
       "      <td>52.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">3-5年</th>\n",
       "      <th>博士</th>\n",
       "      <td>93.800000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>学历不限</th>\n",
       "      <td>54.200000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>本科</th>\n",
       "      <td>35.830000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>本科及以上</th>\n",
       "      <td>41.650000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>硕士</th>\n",
       "      <td>27.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>统招本科</th>\n",
       "      <td>40.080000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"5\" valign=\"top\">5-10年</th>\n",
       "      <th>学历不限</th>\n",
       "      <td>59.583333</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>本科</th>\n",
       "      <td>38.436364</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>本科及以上</th>\n",
       "      <td>65.266667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>硕士及以上</th>\n",
       "      <td>83.750000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>统招本科</th>\n",
       "      <td>70.200000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"4\" valign=\"top\">经验不限</th>\n",
       "      <th>大专</th>\n",
       "      <td>17.300000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>学历不限</th>\n",
       "      <td>51.450000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>本科及以上</th>\n",
       "      <td>267.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>统招本科</th>\n",
       "      <td>5.000000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                   平均薪资\n",
       "工作年限  学历               \n",
       "1-3年  本科      22.800000\n",
       "10年以上 本科及以上   64.900000\n",
       "      统招本科    52.500000\n",
       "3-5年  博士      93.800000\n",
       "      学历不限    54.200000\n",
       "      本科      35.830000\n",
       "      本科及以上   41.650000\n",
       "      硕士      27.500000\n",
       "      统招本科    40.080000\n",
       "5-10年 学历不限    59.583333\n",
       "      本科      38.436364\n",
       "      本科及以上   65.266667\n",
       "      硕士及以上   83.750000\n",
       "      统招本科    70.200000\n",
       "经验不限  大专      17.300000\n",
       "      学历不限    51.450000\n",
       "      本科及以上  267.500000\n",
       "      统招本科     5.000000"
      ]
     },
     "execution_count": 60,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 分工作时间和学历平均薪资\r\n",
    "df_year_edulevel =  非薪资面议.groupby(['工作年限','学历']).agg({'平均薪资':'mean'})\r\n",
    "df_year_edulevel"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:18:15.475670Z",
     "iopub.status.busy": "2023-06-14T10:18:15.474753Z",
     "iopub.status.idle": "2023-06-14T10:18:15.489049Z",
     "shell.execute_reply": "2023-06-14T10:18:15.487906Z",
     "shell.execute_reply.started": "2023-06-14T10:18:15.475633Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>行业</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>IT服务</th>\n",
       "      <td>33.750000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>专业技术服务</th>\n",
       "      <td>106.650000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>互联网</th>\n",
       "      <td>38.812500</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>人力资源服务</th>\n",
       "      <td>15.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>人工智能</th>\n",
       "      <td>18.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>其他商务服务业</th>\n",
       "      <td>43.333333</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>印刷/包装/造纸</th>\n",
       "      <td>45.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>咨询服务</th>\n",
       "      <td>97.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>基金/证券/投资</th>\n",
       "      <td>67.260000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>基金/证券/期货</th>\n",
       "      <td>67.929412</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>工程管理/勘察/监理</th>\n",
       "      <td>16.166667</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>房地产开发经营</th>\n",
       "      <td>20.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>房地产租赁/中介</th>\n",
       "      <td>90.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>智能硬件</th>\n",
       "      <td>25.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>服装/纺织/皮革</th>\n",
       "      <td>29.450000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>检测/认证</th>\n",
       "      <td>31.250000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>游戏</th>\n",
       "      <td>22.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>珠宝/首饰</th>\n",
       "      <td>22.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>电子商务</th>\n",
       "      <td>65.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>科技金融</th>\n",
       "      <td>36.650000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>融资租赁</th>\n",
       "      <td>155.800000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>计算机软件</th>\n",
       "      <td>39.360000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>财务/审计/税务</th>\n",
       "      <td>34.400000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>运营商/增值服务</th>\n",
       "      <td>24.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>通信设备</th>\n",
       "      <td>37.885714</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>银行</th>\n",
       "      <td>31.500000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>食品/饮料/酒水</th>\n",
       "      <td>34.900000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>餐饮业</th>\n",
       "      <td>37.500000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  平均薪资\n",
       "行业                    \n",
       "IT服务         33.750000\n",
       "专业技术服务      106.650000\n",
       "互联网          38.812500\n",
       "人力资源服务       15.000000\n",
       "人工智能         18.500000\n",
       "其他商务服务业      43.333333\n",
       "印刷/包装/造纸     45.000000\n",
       "咨询服务         97.500000\n",
       "基金/证券/投资     67.260000\n",
       "基金/证券/期货     67.929412\n",
       "工程管理/勘察/监理   16.166667\n",
       "房地产开发经营      20.500000\n",
       "房地产租赁/中介     90.000000\n",
       "智能硬件         25.000000\n",
       "服装/纺织/皮革     29.450000\n",
       "检测/认证        31.250000\n",
       "游戏           22.500000\n",
       "珠宝/首饰        22.500000\n",
       "电子商务         65.000000\n",
       "科技金融         36.650000\n",
       "融资租赁        155.800000\n",
       "计算机软件        39.360000\n",
       "财务/审计/税务     34.400000\n",
       "运营商/增值服务     24.500000\n",
       "通信设备         37.885714\n",
       "银行           31.500000\n",
       "食品/饮料/酒水     34.900000\n",
       "餐饮业          37.500000"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 分行业\r\n",
    "df_industry = 非薪资面议.groupby('行业').agg({'平均薪资':'mean'})\r\n",
    "df_industry"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {
    "execution": {
     "iopub.execute_input": "2023-06-14T10:18:40.622744Z",
     "iopub.status.busy": "2023-06-14T10:18:40.621474Z",
     "iopub.status.idle": "2023-06-14T10:18:40.664987Z",
     "shell.execute_reply": "2023-06-14T10:18:40.663775Z",
     "shell.execute_reply.started": "2023-06-14T10:18:40.622704Z"
    },
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "with pd.ExcelWriter(key+'_'+output_time+'_.xlsx') as writer:  \r\n",
    "    df_year_salary.to_excel(writer, sheet_name='分工作年限平均薪资')\r\n",
    "    df_year_edulevel.to_excel(writer, sheet_name='分学历平均薪资')\r\n",
    "    df_industry.to_excel(writer, sheet_name='分行业平均薪资')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "py35-paddle1.2.0"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
